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A = pGRN144 
B = pSEAP2-Basic 
C= BGL2-EC047III fragment from A 
into BGL2-NRU1 sites of B 
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GGACCCGGCGGCTTTCCGCGCGCTGGTGGCCCAGTGCCTGGTGTGCGTGCCCTGGGACGC 
CCTGGGCCGCCGAAAGGCGCGCGACCACCGGGTCACGGACCACACGCACGGGACCCTGCG 



NFkB_CS1
GGGRQTYYQC 
NFkB-MHC-I . 2 
TGGGCTTCCCC 

ACGGCCGCCCCCCGCCGCCCCCTCCTTCCGCCAGGTGGGCCTCCCCGGGGTCGGCGTCCG 
TGCCGGCGGGGGGCGGCGGGGGAGGAAGGCGGTCCACCCGGAGGGGCCCCAGCCGCAGGC 

Intron1

GCTGGGGTTGAGGGCGGCCGGGGGGAACCAGCGACATGCGGAGAGCAGCGCAGGCGACTC 
CGACCCCAACTCCCGCCGGCCCCCCTTGGTCGCTGTACGCCTCTCGTCGCGTCCGCTGAG 

NFkB_CS1
GGGRQTYYQC 
NFkB_CS2 
RGGGRMTYYCC 

Topo_II_cleavage_site 
RNYNNCNNGYNGKTNYNY 

AGGGCGCTTCCCCCGCAGGTGTCCTGCCTGAAGGAGCTGGTGGCCCGAGTGCTGCAGAGG 
TCCCGCGAAGGGGGCGTCCACAGGACGGACTTCCTCGACCACCGGGCTCACGACGTCTCC 



FIG. 12 
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GAAGGAACTC 
AGTCAACGAT 
ATGAACCTCG 
GATCACTTTC 
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CGATGGATAT 
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CAAGTTGGAC 
ATATGATAGT 
AATTACTTTC 
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AGATTATTTT 
ATCCAACCTT 
AAGAAAACAT 
TAACTTACTT 
TTAATGGGAA 
GTTTCATCAA 
CTTAGGATTC 
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ATATTAATTA 
AATCATGGCA 
TAAAACGTTG 
CTCAAAGTCA 
AATATTGTTG 
TGCAAGAAAA 
AATGCTTAGT 
CTT CAATGAT 
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TTGGAAATAT 
CAAAACCTAA 
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TTATAAAGAT 
CTACTCCACG 
GAAGTATTTT 
TGAACTTCTT 
TTGGATTTCA 
GCTCTTTCAA 
T AGAG C AATG 
T AAT ATT CCA 
AACGTTTTTG 
AGGTGGAGCA 
ACAATGTCAA 
AATTGGAATA 
TAATAGAAAT 
ACAATATTTC 
AGATTTAATA 
TGCCTACATG 
CAAAATCTTG 
GAAAACTTGA 
GCTGTTTAGC 
AATTTTTCTA 
AAGAATTTTC 
ACTCATTCAC 
C ATGGATG C A 
GAAAACATCT 
CGTCGTCTCG 
GTTACTCCAA 
AAAATGTCAA 
AAAAGAGGTT 
TCAGACTAAT 
AAGAAGATTG 
GAAGTTATTG 
TTAAAGATCC 
AAGTATGAGG 
CTTCTTTGCA 
AAAAACTATC 
TGGATTATGA 
TTCGAAAAAC 
T C CAG AAG AT 
CTTGAAAATG 
AGCAAAGCAA 
TTAATATTTG 
CAAACAAAAG 
ATTTTATTAT 
AATCAATGAA 



FIG. 13A 



+ 




14/103 



24 01 CCCTGAAAAT 

24 51 TTTTGATTAC 

2 5 01 ATAAACGTAA 

2 551 GACTAGTTTT 

26 01 GTGTTGAGGA 

26 51 TCAATTGATA 

27 01 AGAAGGAATT 
2 751 CAATGTGGCT 

28 01 CATTATTTTA 
28 51 CAACAAGTTA 
2 9 01 AATACAAGGA 

2 951 T T AGAGGT AT 

3 0 01 CCTTGTGTGC 
3 051 ACTTTTTCCT 
3101 AAGTACATTT 
3151 GCTAAAAAGT 
32 01 CTATTCTAAC 
3 2 51 TGGGGTTTTG 



CCAAATGTTA 
AACTCAAGAG 
GTCGTGAAAA 
CCATTAAGTC 
GCAAAATATT 
TGAAAACTCT 
CTGTGTACAC 
CAAGAAGAAA 
GAAAGACGAT 
TTTATATCAG 
CCACTTTAAG 
CTAAAATTAT 
AAT AT TAAGG 
TAGCACACTG 
TCAACAGAGT 
GACCAATGTC 
TTATTTTGGA 
GGGTTTTGGG 



ATCTTCTAAT 
AATAATGCAG 
TGGATTTAAA 
CAAGCAAATT 
GTTCAAGATT 
TGCTTTAATG 
TCAATCTAAA 
CTAAAGTCGT 
TACAACCGAA 
GCGGTTACAA 
AAGAACTTAG 
ATACTCTGTA 
ATACAATTTT 
AAGCACTTTA 
TTGCATGATC 
AATCTCTAAT 
AAGTTAATTT 
GTTTTGGGG 



GAGACTTACA 
TATTGTTTAT 
TTCAATATGA 
TGCAAAATAC 
ACTGCGATTG 
CCAAATATTA 
CATGCAAACA 
TTTTAATGAA 
GACTTTGCGA 
ATACATGCAA 
CTATGAGCAG 
ACCAGAGCAT 
TGGAGAGGAG 
TTGAAATATT 
CTCAAGGCAA 
TCAATATGAT 
TCAATTTTTG 



GATGACTATC 
TGAGAAACTT 
AGAAACTACA 
GGAATGGATA 
GATTGGCATC 
ACTTGAGAAT 
AAG AAAG CAT 
TAACATTACC 
ATAAAACTCT 
TGAGC C AAAG 
TATGATCGAC 
TCTTTAAATA 
CAT TAT C C AG 
CAGCACAAAA 
AAGAAGCAAA 
GCATAGTCGA 
TCTTATATAC 
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KNNIVIDSKN 
KKTL I VEAKQ 
VSSILSSFYY 
NNAVLFIEKL 
VQDYCDWIGI 
LKSFLMNNIT 
KNLAMSSMID 
KHFIEIFSTK 
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1 gcagcgctgc gtcctgctgc gcacgtggga 
61 gcgcgctccc cgctgccgag ccgtgcgctc 
121 gccgctggcc acgttcgtgc ggcgcctggg 
181 ggacccggcg gctttccgcg cgctggtggc 
241 acggccgccc cccgccgccc cctccttccg 
301 ccgagtgctg cagaggctgt gcgagcgcgg

361 gctgctggac ggggcccgcg ggggcccccc
421 cctgcccaac acggtgaccg acgcactgcg

481 ccgcgtgggc gacgacgtgc tggttcacct
541 ggctcccagc tgcgcctacc aggtgtgcgg 
601 tcaggcccgg cccccgccac acgctagtgg 
661 ctggaaccat agcgtcaggg aggccggggt 
721 gaggcgcggg ggcagtgcca gccgaagtct 
781 tgcccctgag ccggagcgga cgcccgttgg 
841 gcgtggaccg agtgaccgtg gtttctgtgt 
901 cacctctttg gagggtgcgc tctctggcac 
961 gcaccacgcg ggccccccat ccacatcgcg 

1021 cccggtgtac gccgagacca agcacttcct 
1081 gccctccttc ctactcagct ctctgaggcc 
1141 gaccatcttt ctgggttcca ggccctggat 
1201 gccccagcgc tactggcaaa tgcggcccct 
1261 gtgcccctac ggggtgctcc tcaagacgca 
1321 agccggtgtc tgtgcccggg agaagcccca 
1381 cacagacccc cgtcgcctgg tgcagctgct 
1441 cggcttcgtg cgggcctgcc tgcgccggct 
1501 caacgaacgc cgcttcctca ggaacaccaa 
1561 gctctcgctg caggagctga cgtggaagat 
1621 gagcccaggg gttggctgtg ttccggccgc 
1681 caagttcctg cactggctga tgagtgtgta 
1741 tgtcacggag accacgtttc aaaagaacag 
1801 caagttgcaa agcattggaa tcagacagca 
1861 ggaagcagag gtcaggcagc atcgggaagc 
1921 cttcatcccc aagcctgacg ggctgcggcc 
1981 cagaacgttc cgcagagaaa agagggccga 

2041 cagcgtgctc aactacgagc gggcgcggcg
2101 cctggacgat atccacaggg cctggcgcac 
2161 gccgcctgag ctgtactttg tcaaggtgga 
2221 ggacaggctc acggaggtca tcgccagcat 
2281 tcggtatgcc gtggtccaga aggccgccca 
2341 cgtctctacc ttgacagacc tccagccgta 
2401 gaccagcccg ctgagggatg ccgtcgtcat 
2461 cagtggcctc ttcgacgtct tcctacgctt 
2521 caagtcctac gtccagtgcc aggggatccc 
2581 cagcctgtgc tacggcgaca tggagaacaa 
2641 gctcctgcgt ttggtggatg atttcttgtt 
2701 cttcctcagg accctggtcc gaggtgtccc 
2761 gacagtggtg aacttccctg tagaagacga 
2821 gccggcccac ggcctattcc cctggtgcgg 
2881 gcagagcgac tactccagct atgcccggac 
2941 cggcttcaag gctgggagga acatgcgtcg 
3001 tcacagcctg tttctggatt tgcaggtgaa 
3061 caagatcctc ctgctgcagg cgtacaggtt 
3121 tcagcaagtt tggaagaacc ccacattttt 
3181 ctgctactcc atcctgaaag ccaagaacgc 
3241 cggccctctg ccctccgagg ccgtgcagtg 
3301 gactcgacac cgtgtcacct acgtgccact 
3361 gctgagtcgg aagctcccgg ggacgacgct 
3421 actgccctca gacttcaaga ccatcctgga 
3481 gagcagacac cagcagccct gtcacgccgg 
3541 cacacccagg cccgcaccgc tgggagtctg 
3601 catgtccggc tgaaggctga gtgtccggct 
3661 gagtgtccag cacacctgcc gtcttcactt 
3721 gggccagctt ttcctcacca ggagcccggc 
3781 ccagattcgc cattgttcac ccctcgccct 

3841 aggtggagac cctgagaagg accctgggag
3901 ccctgtacac aggcgaggac cctgcacctg
3961 gaggtgctgt gggagtaaaa tactgaatat



agccctggcc ccggccaccc ccgcgatgcc 
cctgctgcgc agccactacc gcgaggtgct 
gccccagggc tggcggctgg tgcagcgcgg 
ccagtgcctg gtgtgcgtgc cctgggacgc 
ccaggtgtcc tgcctgaagg agctggtggc 
cgcgaagaac gtgctggcct tcggcttcgc 
cgaggccttc accaccagcg tgcgcagcta 
ggggagcggg gcgtgggggc tgctgctgcg
gctggcacgc tgcgcgctct ttgtgctggt 
gccgccgctg taccagctcg gcgctgccac 
accccgaagg cgtctgggat gcgaacgggc 
ccccctgggc ctgccagccc cgggtgcgag 
gccgttgccc aagaggccca ggcgtggcgc 
gcaggggtcc tgggcccacc cgggcaggac 
ggtgtcacct gccagacccg ccgaagaagc 
gcgccactcc cacccatccg tgggccgcca 
gccaccacgt ccctgggaca cgccttgtcc 
ctactcctca ggcgacaagg agcagctgcg 
cagcctgact ggcgctcgga ggctcgtgga 
gccagggact ccccgcaggt tgccccgcct 
gtttctggag ctgcttggga accacgcgca 
ctgcccgctg cgagctgcgg tcaccccagc 
gggctctgtg gcggcccccg aggaggagga 
ccgccagcac agcagcccct ggcaggtgta 
ggtgccccca ggcctctggg gctccaggca 
gaagttcatc tccctgggga agcatgccaa 
gagcgtgcgg gactgcgctt ggctgcgcag 
agagcaccgt ctgcgtgagg agatcctggc 
cgtcgtcgag ctgctcaggt ctttctttta 
gctctttttc taccggaaga gtgtctggag 
cttgaagagg gtgcagctgc gggagctgtc 
caggcccgcc ctgctgacgt ccagactccg 
gattgtgaac atggactacg tcgtgggagc 
gcgtctcacc tcgagggtga aggcactgtt 
ccccggcctc ctgggcgcct ctgtgctggg 
cttcgtgctg cgtgtgcggg cccaggaccc 
tgtgacgggc gcgtacgaca ccatccccca 
catcaaaccc cagaacacgt actgcgtgcg 
tgggcacgtc cgcaaggcct tcaagagcca 
catgcgacag ttcgtggctc acctgcagga 
cgagcagagc tcctccctga atgaggccag 
catgtgccac cacgccgtgc gcatcagggg 
gcagggctcc atcctctcca cgctgctctg 
gctgtttgcg gggattcggc gggacgggct 
ggtgacacct cacctcaccc acgcgaaaac 
tgagtatggc tgcgtggtga acttgcggaa 
ggccctgggt ggcacggctt ttgttcagat 
cctgctgctg gatacccgga ccctggaggt 
ctccatcaga gccagtctca ccttcaaccg 
caaactcttt ggggtcttgc ggctgaagtg 
cagcctccag acggtgtgca ccaacatcta 
tcacgcatgt gtgctgcagc tcccatttca 
cctgcgcgtc atctctgaca cggcctccct 
agggatgtcg ctgggggcca agggcgccgc 
gctgtgccac caagcattcc tgctcaagct 
cctggggtca ctcaggacag cccagacgca 
gactgccctg gaggccgcag ccaacccggc 
ctgatggcca cccgcccaca gccaggccga 
gctctacgtc ccagggaggg aggggcggcc 
aggcctgagt gagtgtttgg ccgaggcctg 
gaggcctgag cgagtgtcca gccaagggct 
ccccacaggc tggcgctcgg ctccacccca 
ttccactccc cacataggaa tagtccatcc 
gccctccttt gccttccacc cccaccatcc 
ctctgggaat ttggagtgac caaaggtgtg 
gatgggggtc cctgtgggtc aaattggggg 
atgagttttt cagttttgaa aaaaa 
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MPRAPRCRAVRSLLRSHYREVLPLATFVRRLGPQGWRLVQRGDP 
AAFRALVAQCLVCVPWDARPPPAAPSFRQVSCLKELVARVLQRL 
CERGAKNVLAFGFALLDGARGGPPEAFTTSVRSYLPNTVTDALR 
GSGAWGLLLRRVGDDVLVHLLARCALFVLVAPSCAYQVCGPPLY 
QLGAATQARPPPHASGPRRRLGCERAWNHSVREAGVPLGLPAPG 
ARRRGGSASRSLPLPKRPRRGAAPEPERTPVGQGSWAHPGRTRG 
PSDRGFCVVSPARPAEEATSLEGALSGTRHSHPSVGRQHHAGPP
STSRPPRPWDTPCPPVYAETKHFLYSSGDKEQLRPSFLLSSLRP 
SLTGARRLVETIFLGSRPWMPGTPRRLPRLPQRYWQMRPLFLEL 
LGNHAQCPYGVLLKTHCPLRAAVTPAAGVCAREKPQGSVAAPEE 
EDTDPRRLVQLLRQHSSPWQVYGFVRACLRRLVPPGLWGSRHNE 
RRFLRNTKKFISLGKHAKLSLQELTWKMSVRDCAWLRRSPGVGC 
VPAAEHRLREEILAKFLHWLMSVYVVELLRSFFYVTETTFQKNR
LFFYRKSVWSKLQSIGIRQHLKRVQLRELSEAEVRQHREARPAL
LTSRLRFIPKPDGLRPIVNMDYVVGARTFRREKRAERLTSRVKA
LFSVLNYERARRPGLLGASVLGLDDIHRAWRTFVLRVRAQDPPP
ELYFVKVDVTGAYDTIPQDRLTEVIASIIKPQNTYCVRRYAVVQ
KAAHGHVRKAFKSHVSTLTDLQPYMRQFVAHLQETSPLRDAVVI
EQSSSLNEASSGLFDVFLRFMCHHAVRIRGKSYVQCQGIPQGSI
LSTLLCSLCYGDMENKLFAGIRRDGLLLRLVDDFLLVTPHLTHA
KTFLRTLVRGVPEYGCVVNLRKTVVNFPVEDEALGGTAFVQMPA
HGLFPWCGLLLDTRTLEVQSDYSSYARTSIRASLTFNRGFKAGR
NMRRKLFGVLRLKCHSLFLDLQVNSLQTVCTNIYKILLLQAYRF
HACVLQLPFHQQVWKNPTFFLRVISDTASLCYSILKAKNAGMSL
GAKGAAGPLPSEAVQWLCHQAFLLKLTRHRVTYVPLLGSLRTAQ 
TQLSRKLPGTTLTALEAAANPALPSDFKTILD 

FIG. 17 

GGCCAAGTTCCTGCACTGGCTGATGAGTGTGTACGTCGTCGAGCTGCTCAGGTCTTTCTT 
TTATGTCACGGAGACCACGTTTCAAAAGAACAGGCTCTTTTTCTACCGGAAGAGTGTCTG 
GAGCAAGTTGCAAAGCATTGGAATCAGACAGCACTTGAAGAGGGTGCAGCTGCGGGAGCT 
GTCGGAAGCAGAGGTCAGGCAGCATCGGGAAGCCAGGCCCGCCCTGCTGACGTCCAGACT 
CCGCTTCATCCCCAAGCCTGACGGGCTGCGGCCGATTGTGAACATGGACTACGTCGTGGG 
AGCCAGAACGTTCCGCAGAGAAAAGAGGGCCGAGCGTCTCACCTCGAGGGTGAAGGCACT 
GTTCAGCGTGCTCAACTACGAGCGGGCGCGGCGCCCCGGCCTCCTGGGCGCCTCTGTGCT 
GGGCCTGGACGATATCCACAGGGCCTGGCGCACCTTCGTGCTGCGTGTGCGGGCCCAGGA 
CCCGCCGCCTGAGCTGTACTTTGTCAAGGTGGATGTGACGGGCGCGTACGACACCATCCC 
CCAGGACAGGCTCACGGAGGTCATCGCCAGCATCATCAAACCCCAGAACACGTACTGCGT 
GCGTCGGTATGCCGTGGTCCAGAAGGCCGCCCATGGGCACGTCCGCAAGGCCTTCAAGAG 
CCACGTCCTACGTCCAGTGCCAGGGGATCCCGCAGGGCTCCATCCTCTCCACGCTGCTCT 
GCAGCCTGTGCTACGGCGACATGGAGAACAAGCTGTTTGCGGGGATTCGGCGGGACGGGC 
TGCTCCTGCGTTTGGTGGATGATTTCTTGTTGGTGACACCTCACCTCACCCACGCGAAAA 
CCTTCCTCAGGACCCTGGTCCGAGGTGTCCCTGAGTATGGCTGCGTGGTGAACTTGCGGA 
AGACAGTGGTGAACTTCCCTGTAGAAGACGAGGCCCTGGGTGGCACGGCTTTTGTTCAGA
TGCCGGCCCACGGCCTATTCCCCTGGTGCGGCCTGCTGCTGGATACCCGGACCCTGGAGG 
TGCAGAGCGACTACTCCAGCTATGCCCGGACCTCCATCAGAGCCAGTCTCACCTTCAACC 
GCGGCTTCAAGGCTGGGAGGAACATGCGTCGCAAACTCTTTGGGGTCTTGCGGCTGAAGT 
GTCACAGCCTGTTTCTGGATTTGCAGGTGAACAGCCTCCAGACGGTGTGCACCAACATCT
ACAAGATCCTCCTGCTGCAGGCGTACAGGTTTCACGCATGTGTGCTGCAGCTCCCATTTC 
ATCAGCAAGTTTGGAAGAACCCCACATTTTTCCTGCGCGTCATCTCTGACACGGCCTCCC 
TCTGCTACTCCATCCTGAAAGCCAAGAACGCAGGGATGTCGCTGGGGGCCAAGGGCGCCG 
CCGGCCCTCTGCCCTCCGAGGCCGTGCAGTGGCTGTGCCACCAAGCATTCCTGCTCAAGC
TGACTCGACACCGTGTCACCTACGTGCCACTCCTGGGGTCACTCAGGACAGCCCAGACGC 
AGCTGAGTCGGAAGCTCCCGGGGACGACGCTGACTGCCCTGGAGGCCGCAGCCAACCCGG 
CACTGCCCTCAGACTTCAAGACCATCCTGGACTGATGGCCACCCGCCCACAGCCAGGCCG 
AGAGCAGACACCAGCAGCCCTGTCACGCCGGGCTCTACGTCCCAGGGAGGGAGGGGCGGC 
CCACACCCAGGCCTGCACCGCTGGGAGTCTGAGGCCTGAGTGAGTGTTTGGCCGAGGCCT 
GCATGTCCGGCTGAAGGCTGAGTGTCCGGCTGAGGCCTGAGCGAGTGTCCAGCCAAGGGC 
TGAGTGTCCAGCACACCTGCCGTCTTCACTTCCCCACAGGCTGGCGCTCGGCTCCACCCC 
AGGGCCAGCTTTTCCTCACCAGGAGCCCGGCTTCCACTCCCCACATAGGAATAGTCCATC 
CCCAGATTCGCCATTGTTCACCCCTCGCCCTGCCCTCCTTTGCCTTCCACCCCCACCATC 
CAGGTGGAGACCCTGAGAAGGACCCTGGGAGCTCTGGGAATTTGGAGTGACCAAAGGTGT 
GCCCTGTACACAGGCGAGGACCCTGCACCTGGATGGGGGTCCCTGTGGGTCAAATTGGGG 
GGAGGTGCTGTGGGAGTAAAATACTGAATATATGAGTTTTTCAGTTTTGAAAAAAAAAAA
AAAAAAAAAAAAAAAA 
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MetSerValTyrValValGluLeuLeuArgSerPhePhe 
TyrValThrGluThrThrPheGlnLysAsnArgLeuPhe 
PheTyrArgLysSerValTrpSerLysLeuGlnSerIle
GlyIleArgGlnHisLeuLysArgValGlnLeuArgGlu
LeuSerGluAlaGluValArgGlnHisArgGluAlaArg
ProAlaLeuLeuThrSerArgLeuArgPheIleProLys
ProAspGlyLeuArgProIleValAsnMetAspTyrVal 
ValGlyAlaArgThrPheArgArgGluLysArgAlaGlu 
ArgLeuThrSerArgValLysAlaLeuPheSerValLeu 
AsnTyrGluArgAlaArgArgProGlyLeuLeuGlyAla 
SerValLeuGlyLeuAspAspIleHisArgAlaTrpArg 
ThrPheValLeuArgValArgAlaGlnAspProProPro 
GluLeuTyrPheValLysValAspValThrGlyAlaTyr 
AspThrIleProGlnAspArgLeuThrGluValIleAla
SerIleIleLysProGlnAsnThrTyrCysValArgArg
TyrAlaValValGlnLysAlaAlaHisGlyHisValArg 
LysAlaPheLysSerHisValLeuArgProValProGly 
AspProAlaGlyLeuHisProLeuHisAlaAlaLeuGln 
ProValLeuArgArgHisGlyGluGlnAlaValCysGly 
AspSerAlaGlyArgAlaAlaProAlaPheGlyGly 

FIG. 19 

i 

met 

GCAGCGCTGCGTCCTGCTGCGCACGTGGGAAGCCCTGGCCCCGGCCACCCCCGCG ATG 

10 

cys arg ala val arg ser leu leu arg ser 
TGC CGA GCC GTG CGC TCC CTG CTG CGC AGC 

30 

leu pro leu ala thr phe val arg arg leu 
CTG CCG CTG GCC ACG TTC GTG CGG CGC CTG 

40 

arg leu val gln arg gly asp pro ala ala
CGG CTG GTG CAG CGC GGG GAC CCG GCG GCT 

60 

ala gln cys leu val cys val pro trp asp
GCC CAG TGC CTG GTG TGC GTG CCC TGG GAC 

70 

ala ala pro ser phe arg gln val ser cys
GCC GCC CCC TCC TTC CGC CAG GTG TCC TGC 

90 

ala arg val leu gln arg leu cys glu arg
GCC CGA GTG CTG CAG AGG CTG TGC GAG CGC 

100 

leu ala phe gly phe ala leu leu asp gly 
CTG GCC TTC GGC TTC GCG CTG CTG GAC GGG 

120 

pro glu ala phe thr thr ser val arg ser 
CCC GAG GCC TTC ACC ACC AGC GTG CGC AGC 



pro arg ala pro arg 
CCG CGC GCT CCC CGC 

20 

his tyr arg glu val 
CAC TAC CGC GAG GTG 



gly pro gln gly trp
GGG CCC CAG GGC TGG 

50 

phe arg ala leu val 
TTC CGC GCG CTG GTG 



ala arg pro pro pro 
GCA CGG CCG CCC CCC 

80 

leu lys glu leu val 
CTG AAG GAG CTG GTG 



gly ala lys asn val 
GGC GCG AAG AAC GTG 

110 

ala arg gly gly pro 
GCC CGC GGG GGC CCC 



FIG. 20A 
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tyr leu pro 
TAC CTG CCC 



trp gly leu 
TGG GGG CTG 



leu leu ala 
CTG CTG GCA 



ala tyr gin 
GCC TAC CAG 



thr gin ala 
ACT CAG GCC 



leu gly cys 
CTG GGA TGC 



val pro leu 
GTC CCC CTG 



ser ala ser 
AGT GCC AGC 



ala ala pro 
GCT GCC CCT 



ala his pro 
GCC CAC CCG 



val val ser 
GTG GTG TCA 



gly ala leu 
GGT GCG CTC 



gin his his 
CAG CAC CAC 



trp asp thr 
TGG GAC ACG 



asn thr val 
AAC ACG GTG 

140 

leu leu arg 
CTG CTG CGC 



arg cys ala 
CGC TGC GCG 

170 

val cys gly 
GTG TGC GGG 



arg pro pro 
CGG CCC CCG 

200 

glu arg ala 
GAA CGG GCC 



gly leu pro 
GGC CTG CCA 

230 

arg ser leu 
CGA AGT CTG 



glu pro glu 
GAG CCG GAG 

260 

gly arg thr 
GGC AGG ACG 



pro ala arg 
CCT GCC AGA 

290 

ser gly thr 
TCT GGC ACG 



ala gly pro 
GCG GGC CCC 

320 

pro cys pro 
CCT TGT CCC 



130 

thr asp ala 
ACC GAC GCA 



arg val gly 
CGC GTG GGC 

160 

leu phe val 
CTC TTT GTG 



pro pro leu 
CCG CCG CTG 

190 

pro his ala 
CCA CAC GCT 



trp asn his 
TGG AAC CAT 

220 

ala pro gly 
GCC CCG GGT 



pro leu pro 
CCG TTG CCC 

250 

arg thr pro 
CGG ACG CCC 



arg gly pro 
CGT GGA CCG 



280 

pro ala glu 
CCC GCC GAA 



arg his ser 
CGC CAC TCC 

310 

pro ser thr 
CCA TCC ACA 



pro val tyr 
CCG GTG TAC 



leu arg gly 
CTG CGG GGG 



asp asp val 
GAC GAC GTG 



leu val ala 
CTG GTG GCT 



tyr gin leu 
TAC CAG CTC 



ser gly pro 
AGT GGA CCC 



ser val arg 
AGC GTC AGG 



ala arg arg 
GCG AGG AGG 



lys arg pro 
AAG AGG CCC 



val gly gin 
GTT GGG CAG 



ser asp arg 
AGT GAC CGT 



glu ala thr 
GAA GCC ACC 



his pro ser 
CAC CCA TCC 



ser arg pro 
TCG CGG CCA 



ala glu thr 
GCC GAG ACC 



ser gly ala 
AGC GGG GCG 

150 
leu val his 
CTG GTT CAC 



pro ser cys 
CCC AGC TGC 

180 
gly ala ala 
GGC GCT GCC 



arg arg arg 
CGA AGG CGT 

210 
glu ala gly 
GAG GCC GGG 



arg gly gly 
CGC GGG GGC 

240 
arg arg gly 
AGG CGT GGC 



gly ser trp 
GGG TCC TGG 

270 
gly phe cys 
GGT TTC TGT 



ser leu glu 
TCT TTG GAG 

300 
val gly arg 
GTG GGC CGC 



pro arg pro 
CCA CGT CCC 

330 
lys his phe 
AAG CAC TTC 
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leu tyr ser 
CTC TAC TCC 



leu ser ser 
CTC AGC TCT 



glu thr ile 
GAG ACC ATC 



arg arg leu 
CGC AGG TTG 



leu phe leu 
CTG TTT CTG 



val leu leu 
GTG CTC CTC 



ala ala gly 
GCA GCC GGT 



ala pro glu 
GCC CCC GAG 



leu arg gin 
CTC CGC CAG 



ala cys leu 
GCC TGC CTG 



his asn glu 
CAC AAC GAA 



leu gly lys 
CTG GGG AAG 



met ser val 
ATG AGC GTG 



gly cys val 
GGC TGT GTT 



ser gly asp 
TCA GGC GAC 

350 

leu arg pro 
CTG AGG CCC 



phe leu gly 
TTT CTG GGT 

380 

pro arg leu 
CCC CGC CTG 



glu leu leu 
GAG CTG CTT 

410 

lys thr his 
AAG ACG CAC 



val cys ala 
GTC TGT GCC 

440 

glu glu asp 
GAG GAG GAC 



his ser ser 
CAC AGC AGC 

470 

arg arg leu 
CGC CGG CTG 



arg arg phe 
CGC CGC TTC 

500 

his ala lys 
CAT GCC AAG 



arg asp cys 
CGG GAC TGC 

530 

pro ala ala 
CCG GCC GCA 



340 

lys glu gin 
AAG GAG CAG 



ser leu thr 
AGC CTG ACT 

370 

ser arg pro 
TCC AGG CCC 



pro gin arg 
CCC CAG CGC 

400 

gly asn his 
GGG AAC CAC 



cys pro leu 
TGC CCG CTG 

430 

arg glu lys 
CGG GAG AAG 



thr asp pro 
ACA GAC CCC 

460 

pro trp gin 
CCC TGG CAG 



val pro pro 
GTG CCC CCA 

490 

leu arg asn 
CTC AGG AAC 



leu ser leu 
CTC TCG CTG 

520 

ala trp leu 
GCT TGG CTG 



glu his arg 
GAG CAC CGT 



leu arg pro 
CTG CGG CCC 



gly ala arg 
GGC GCT CGG 



trp met pro 
TGG ATG CCA 



tyr trp gin 
TAC TGG CAA 



ala gin cys 
GCG CAG TGC 



arg ala ala 
CGA GCT GCG 



pro gin gly 
CCC CAG GGC 



arg arg leu 
CGT CGC CTG 



val tyr gly 
GTG TAC GGC 



gly leu trp 
GGC CTC TGG 



thr lys lys 
ACC AAG AAG 



gin glu leu 
CAG GAG CTG 



arg arg ser 
CGC AGG AGC 



leu arg glu 
CTG CGT GAG 



ser phe leu 
TCC TTC CTA 

360 
arg leu val 
AGG CTC GTG 



gly thr pro 
GGG ACT CCC 

390 
met arg pro 
ATG CGG CCC 



pro tyr gly 
CCC TAC GGG 

420 
val thr pro 
GTC ACC CCA 



ser val ala 
TCT GTG GCG 

450 
val gin leu 
GTG CAG CTG 



phe val arg 
TTC GTG CGG 

480 
gly ser arg 
GGC TCC AGG 



phe ile ser 
TTC ATC TCC 

510 
thr trp lys 
ACG TGG AAG 



pro gly val 
CCA GGG GTT 

540 
glu ile leu 
GAG ATC CTG 
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ala lys phe 
GCC AAG TTC 



1 eu 
CTC 


arg 
AGG 


ser 
TCT 


arg 
AGG 


leu 
CTC 


_ i_ _ 
pne 

TTT 


ile 
ATT 


gly 
GGA 


ile 
ATC 


ser 
i-n pp 


glu 

P 7\ 7\ 

bAA 


ala 

(jCA 


leu 
CTG 


thr 
ACG 


ser 
TCC 


pro 

o op 

CCCj 


ile 
ATT 


val 
GTG 


arg 

A P A 

AvaA 


glu 

A. TV 

bAA 


lys 

7\ A P 

AAva 


phe 

mrpri 


ser 

a pp 
AGC 


val 
crc 


giy 

GGC 


ala 
GCC 


ser 
TCT 


thr 
ACC 


phe 
TTC 


val 
GTG 


tyr 
TAC 


phe 
TTT 


val 
GTC 


gin 

CAG 


asp 
GAC 


arg 
AGG 


asn 
AAC 


thr 
ACG 


tyr 
TAC 



1 eu 
CTG 


hi s 
CAC 


trp 
TGG 


560 
phe 
TTC 


phe 
TTT 


tyr 
TAT 


phe 
TTC 
590 
arg 
AGA 


tyr 
TAC 

gin 
CAG 


arg 
CGG 

his 
CAC 


glu 

par 


val 


arg 


620 
arg 
AGA 


leu 
CTC 


arg 
CGC 


asn 


met 

A TP 


asp 
pap 


650 
arg 
AGG 


ala 
GCC 


glu 
GAG 


leu 


asn 

A A P 

ML 


tyr 

1 AC 


680 
val 
GTG 


leu 
CTG 


giy 

GGC 


leu 
CTG 


arg 
CGT 


val 
GTG 


710 
lys 
AAG 


val 
GTG 


asp 
GAT 


leu 
CTC 


thr 
ACG 


glu 
GAG 


740 
cys 
TGC 


val 
GTG 


arg 
CGT 



leu 
CTG 


met 
ATG 


ser 
AGT 


val 
GTC 


tnr 
ACG 


glu 
GAG 


lys 
AAG 


ser 
AGT 


580 
val 
GTC 


leu 
TTG 


lys 
AAG 


arg 
AGG 


gin 
CAG 


his 
CAT 


610 
arg 
CGG 


phe 

rprpp 


ile 

l\rpp 

Hi L 


pro 
ppp 

CCC 


tyr 
TAC 


val 
GTC 


640 
val 
GTG 


arg 
CGT 


leu 
CTC 


thr 
ACC 


glu 
GAG 


arg 
CGG 


670 
ala 
GCG 


leu 

PTP 


asp 

P7\ p 

CAC 


asp 

CA 1 


arg 
CGG 


ala 
GCC 


700 
gin 
CAG 


val 
GTG 


thr 
ACG 


giy 

GGC 


val 
GTC 


ile 
ATC 


730 
ala 
GCC 


arg 
CGG 


tyr 
TAT 


ala 
GCC 



val tyr val 
GTG TAC GTC 



4- "U. -v- 

unr 
ACC 


4- "Ui -v- 
Llil 

ACG 


phe 
TTT 


crp 
TGG 


ser 
AGC 


lys 
AAG 


val 


gin 
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ser 
AGC 
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ATC 


ile 
ATC 


val 
GTG 


val 
GTC 


gin 
CAG 



val glu leu 
GTC GAG CTG 

570 

gin lys asn 
CAA AAG AAC 



leu gin ser 
TTG CAA AGC 

600 
arg glu leu 
CGG GAG CTG 



pro ala leu 
CCC GCC CTG 

630 
gly leu arg 
GGG CTG CGG 



thr phe arg 
ACG TTC CGC 

660 
lys ala leu 
AAG GCA CTG 



gly leu leu 
GGC CTC CTG 

690 
ala trp arg 
GCC TGG CGC 

pro glu leu 
CCT GAG CTG 

720 
thr ile pro 
ACC ATC CCC 



lys pro gin 
AAA CCC CAG 

750 

lys ala ala 
AAG GCC GCC 
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760 

his gly his val arg lys ala phe lys ser his val leu arg pro 

CAT GGG CAC GTC CGC AAG GCC TTC AAG AGC CAC GTC CTA CGT CCA 

770 780 

val pro gly asp pro ala gly leu his pro leu his ala ala leu 

GTG CCA GGG GAT CCC GCA GGG CTC CAT CCT CTC CAC GCT GCT CTG 



790 

gln pro val leu arg arg his gly glu gln ala val cys gly asp
CAG CCT GTG CTA CGG CGA CAT GGA GAA CAA GCT GTT TGC GGG GAT 

800 807 
ser ala gly arg ala ala pro ala phe gly gly OP 

TCG GCG GGA CGG GCT GCT CCT GCG TTT GGT GGA TGA TTTCTTGTTGGT 
GACACCTCACCTCACCCACGCGAAAACCTTCCTCAGGACCCTGGTCCGAGGTGTCCCTGA 
GTATGGCTGCGTGGTGAACTTGCGGAAGACAGTGGTGAACTTCCCTGTAGAAGACGAGGC 
CCTGGGTGGCACGGCTTTTGTTCAGATGCCGGCCCACGGCCTATTCCCCTGGTGCGGCCT 
GCTGCTGGATACCCGGACCCTGGAGGTGCAGAGCGACTACTCCAGCTATGCCCGGACCTC 
CATCAGAGCCAGTCTCACCTTCAACCGCGGCTTCAAGGCTGGGAGGAACATGCGTCGCAA 
ACTCTTTGGGGTCTTGCGGCTGAAGTGTCACAGCCTGTTTCTGGATTTGCAGGTGAACAG 
CCTCCAGACGGTGTGCACCAACATCTACAAGATCCTCCTGCTGCAGGCGTACAGGTTTCA 
CGCATGTGTGCTGCAGCTCCCATTTCATCAGCAAGTTTGGAAGAACCCCACATTTTTCCT 
GCGCGTCATCTCTGACACGGCCTCCCTCTGCTACTCCATCCTGAAAGCCAAGAACGCAGG 
GATGTCGCTGGGGGCCAAGGGCGCCGCCGGCCCTCTGCCCTCCGAGGCCGTGCAGTGGCT 
GTGCCACCAAGCATTCCTGCTCAAGCTGACTCGACACCGTGTCACCTACGTGCCACTCCT 
GGGGTCACTCAGGACAGCCCAGACGCAGCTGAGTCGGAAGCTCCCGGGGACGACGCTGAC 
TGCCCTGGAGGCCGCAGCCAACCCGGCACTGCCCTCAGACTTCAAGACCATCCTGGACTG 
ATGGCCACCCGCCCACAGCCAGGCCGAGAGCAGACACCAGCAGCCCTGTCACGCCGGGCT 
CTACGTCCCAGGGAGGGAGGGGCGGCCCACACCCAGGCCCGCACCGCTGGGAGTCTGAGG 
CCTGAGTGAGTGTTTGGCCGAGGCCTGCATGTCCGGCTGAAGGCTGAGTGTCCGGCTGAG 
GCCTGAGCGAGTGTCCAGCCAAGGGCTGAGTGTCCAGCACACCTGCCGTCTTCACTTCCC 
CACAGGCTGGCGCTCGGCTCCACCCCAGGGCCAGCTTTTCCTCACCAGGAGCCCGGCTTC 
CACTCCCCACATAGGAATAGTCCATCCCCAGATTCGCCATTGTTCACCCCTCGCCCTGCC 
CTCCTTTGCCTTCCACCCCCACCATCCAGGTGGAGACCCTGAGAAGGACCCTGGGAGCTC 
TGGGAATTTGGAGTGACCAAAGGTGTGCCCTGTACACAGGCGAGGACCCTGCACCTGGAT 
GGGGGTCCCTGTGGGTCAAATTGGGGGGAGGTGCTGTGGGAGTAAAATACTGAATATATG 
AGTTTTTCAGTTTTGAAAAAAAAAAAAAAAAAAAAAAAAAAAAA 
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1 CCATGGGACCCACTGCAGGGGCAGCTGGGAGGCTGCAGGCTTCAGGTCCCAGTGGGGTTG 
GGTACCCTGGGTGACGTCCCCGTCGACCCTCCGACGTCCGAAGTCCAGGGTCACCCCAAC 

61 CCATCTGCCAGTAGAAACCTGATGTAGAATCAGGGCGCGAGTGTGGACACTGTCCTGAAT
GGTAGACGGTCATCTTTGGACTACATCTTAGTCCCGCGCTCACACCTGTGACAGGACTTA 

121 CTCAATGTCTCAGTGTGTGCTGAAACATGTAGAAATTAAAGTCCATCCCTCCTACTCTAC 
GAGTTACAGAGTCACACACGACTTTGTACATCTTTAATTTCAGGTAGGGAGGATGAGATG 

181 TGGGATTGAGCCCCTTCCCTATCCCCCCCCAGGGGCAGAGGAGTTCCTCTGACTCCTGTG 
AC C CTAACTCGGGGAAGGGATAGGGGGGGGTCCC CGTCTC CT CAAGGAGAGTGAGGACAC 

241 GAGGAAGGAATGATACTTTGTTATTTTTCACTGCTGGTACTGAATCCACTGTTTCATTTG 
CTCCTTCCTTACTATGAAACAATAAAAAGTGACGACCATGACTTAGGTGACAAAGTAAAC 



**************************************** 

3 01 TTGGTTTGTTTGTTTTGTTTTGAGAGGCGGTTTCACTCTTGTTGCTCAGGCTGGAGGGAG 
AACCAAACAAACAAAACAAAACTCTCCGCCAAAGTGAGAACAACGAGTCCGACCTCCCTC



************************************************************ 

361 TGCAATGGCGCGATCTTGGCTTACTGCAGCCTCTGCCTCCCAGGTTCAAGTGATTCTCCT 
ACGTTACCGCGCTAGAACCGAATGACGTCGGAGACGGAGGGTCCAAGTTCACTAAGAGGA 

alu 

************************************************************ 

421 GCTTCCGCCTCCCATTTGGCTGGGATTACAGGCACCCGCCACCATGCCCAGCTAATTTTT 
CGAAGGCGGAGGGTAAACCGACCCTAATGTCCGTGGGCGGTGGTACGGGTCGATTAAAAA 



************************************************************ 

481 TGTATTTTTAGTAGAGACGGGGGTGGGGGTGGGGTTCACCATGTTGGCCAGGCTGGTCTC 
ACATAAAAATCATCTCTGCCCCCACCCCCACCCCAAGTGGTACAACCGGTCCGACCAGAG

CAP 



************************************************************ 

54 1 GAACTTCTGACCTCAGATGATCCACCTGCCTCTGCCTCCTAAAGTGCTGGGATTACAGGT 
CTTGAAGACTGGAGTCTACTAGGTGGACGGAGACGGAGGATTTCACGACCCTAATGTCCA 



********************* 

6 01 GTGAGCCACCATGCCCAGCTCAGAATTTACTCTGTTTAGAAACATCTGGGTCTGAGGTAG 
CACTCGGTGGTACGGGTCGAGTCTTAAATGAGACAAATCTTTGTAGACCCAGACTCCATC 

CCAAT 
*************** > 

661 GAAGCTCACCCCACTCAAGTGTTGTGGTGTTTTAAGCCAATGATAGAATTTTTTTATTGT
CTTCGAGTGGGGTGAGTTCACAACACCACAAAATTCGGTTACTATCTTAAAAAAATAACA

721 TGTTAGAACACTCTTGATGTTTTACACTGTGATGACTAAGACATCATCAGCTTTTCAAAG 
ACAATCTTGTGAGAACTACAAAATGTGACACTACTGATTCTGTAGTAGTCGAAAAGTTTC 
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CAP 



> 



781 ACACACTAACTGCACCCATAATACTGGGGTGTCTTCTGGGTATCAGCGATCTTCATTGAA 
TGTGTGATTGACGTGGGTATTATGACCCCACAGAAGACCCATAGTCGCTAGAAGTAACTT

CAP 

841 TGCCGGGAGGCGTTTCCTCGCCATGCACATGGTGTTAATTACTCCAGCATAATCTTCTGC 
ACGGCCCTCCGCAAAGGAGCGGTACGTGTACCACAATTAATGAGGTCGTATTAGAAGACG 



901 TTCCATTTCTTCTCTTCCCTCTTTTAAAATTGTGTTTTCTATGTTGGCTTCTCTGCAGAG 
AAGGTAAAGAAGAGAAGGGAGAAAATTTTAACACAAAAGATACAACCGAAGAGACGTCTC 

CAP 

961 AACCAGTGTAAGCTACAACTTAACTTTTGTTGGAACAAATTTTCCAAACCGCCCCTTTGC 
TTGGTCACATTCGATGTTGAATTGAAAACAACCTTGTTTAAAAGGTTTGGCGGGGAAACG 

1021 CCTAGTGGCAGAGACAATTCACAAACACAGCCCTTTAAAAAGGCTTAGGGATCACTAAGG 
GGATCACCGTCTCTGTTAAGTGTTTGTGTCGGGAAATTTTTCCGAATCCCTAGTGATTCC 

1081 GGATTTCTAGAAGAGCGACCCGTAATCCTTAAGTATTTACAAGACGAGGCTAACCTCCAG 
CCTAAAGATCTTCTCGCTGGGCATTAGGAATTCATAAATGTTCTGCTCCGATTGGAGGTC 

1141 CGAGCGTGACAGCCCAGGGAGGGTGCGAGGCCTGTTCAAATGCTAAGCTTCCATAAATAA
GCTCGCACTGTCGGGTCCCTCCCACGCTCCGGACAAGTTTACGATTCGAAGGTATTTATT 

12 01 AGCAAATTTCCTCCGGCAGTTTCTGGAAAGTAGGAAAGGTTAACATTTAAGGTTGCGTTT 

TCGTTTAAAGGAGGCCGTCAAAGACCTTTCATCCTTTCCAATTGTAAATTCCAACGCAAA 

1261 GTTAGCATTTCAGTGTTTGCCGACCTCAGCTAACAGCATCCCTGCAAGGCCTCGGGAGAC 
CAATCGTAAAGTCACAAACGGCTGGAGTCGATTGTCGTAGGGACGTTCCGGAGCCCTCTG

13 21 CCAGAAGTTTCTCGCCCCTTAGATCCAAACTTGAGCAACCCGGAGTCTGGATTCCTGGGA 

GGTCTTCAAAGAGCGGGGAATCTAGGTTTGAACTCGTTGGGCCTCAGACCTAAGGACCCT 

TopoII 

13 81 AGTCCTCAGCTGTCCTGCGGTTGTGCCGGGGCCCCAGGTCTGGAGGGGACCAGTGGCCGT 
TCAGGAGTCGACAGGACGCCAACACGGCCCCGGGGTCCAGACCTCCCCTGGTCACCGGCA 

1441 GTGGCTTCTACTGCTGGGCTGGAAGTCGGGCCTCCTAGCTCTGCAGTCCGAGGCTTGGAG 
CACCGAAGATGACGACCCGACCTTCAGCCCGGAGGATCGAGACGTCAGGCTCCGAACCTC 



1501 CCAGGTGCCTGGACCCCGAGGCTGCCCTCCACCCTGTGCGGGCGGGATGTGACCAGATGT 
GGTCCACGGACCTGGGGCTCCGACGGGAGGTGGGACACGCCCGCCCTACACTGGTCTACA 

1561 TGGCCTCATCTGCCAGACAGAGTGCCGGGGCCCAGGGTCAAGGCCGTTGTGGCTGGTGTG 
ACCGGAGTAGACGGTCTGTCTCACGGCCCCGGGTCCCAGTTCCGGCAACACCGACCACAC 

1621 AGGCGCCCGGTGCGCGGCCAGCAGGAGCGCCTGGCTCCATTTCCCACCCTTTCTCGACGG 
TCCGCGGGCCACGCGCCGGTCGTCCTCGCGGACCGAGGTAAAGGGTGGGAAAGAGCTGCC 



FIG. 21B 



30/103 



1681 GACCGCCCCGGTGGGTGATTAACAGATATTGGGGTGGTTTGCTCATGGTGGGGACCCCTT 
CTGGCGGGGCCACCCACTAATTGTCTATAACCCCACCAAACGAGTACCACCCCTGGGGAA

1741 CGCCGCCTGAGAACCTGCAAAGAGAAATGACGGGCCTGTGTCAAGGAGCCCAAGTCGCGG 
GCGGCGGACTCTTGGACGTTTCTCTTTACTGCCCGGACACAGTTCCTCGGGTTCAGCGCC 

18 01 GGAAGTGTTGCAGGGAGGCACTCCGGGAGGTCCCGCGTGCCCGTCCAGGGAGCAATGCGT 
CCTTCACAACGTCCCTCCGTGAGGCCCTCCAGGGCGCACGGGCAGGTCCCTCGTTACGCA 

1861 CCTCGGGTTCGTCCCCAGCCGCGTCTACGCGCCTCCGTCCTCCCCTTCACGTCCGGCATT 
GGAGCCCAAGCAGGGGTCGGCGCAGATGCGCGGAGGCAGGAGGGGAAGTGCAGGCCGTAA

1921 CGTGGTGCCCGGAGCCCGACGCCCCGCGTCCGGACCTGGAGGCAGCCCTGGGTCTCCGGA 
GCACCACGGGCCTCGGGCTGCGGGGCGCAGGCCTGGACCTCCGTCGGGACCCAGAGGCCT 

1981 TCAGGCCAGCGGCCAAAGGGTCGCCGCACGCACCTGTTCCCAGGGCCTCCACATCATGGC 
AGTCCGGTCGCCGGTTTCCCAGCGGCGTGCGTGGACAAGGGTCCCGGAGGTGTAGTACCG 

2 041 CCCTCCCTCGGGTTACCCCACAGCCTAGGCCGATTCGACCTCTCTCCGCTGGGGCCCTCG 
GGGAGGGAGCCCAATGGGGTGTCGGATCCGGCTAAGCTGGAGAGAGGCGACCCCGGGAGC 

Sp1

2101 CTGGCGTCCCTGCACCCTGGGAGCGCGAGCGGCGCGCGGGCGGGGAAGCGCGGCCCAGAC 
GACCGCAGGGACGTGGGACCCTCGCGCTCGCCGCGCGCCCGCCCCTTCGCGCCGGGTCTG 

2161 CCCCGGGTCCGCCCGGAGCAGCTGCGCTGTCGGGGCCAGGCCGGGCTCCCAGTGGATTCG 
GGGGCCCAGGCGGGCCTCGTCGACGCGACAGCCCCGGTCCGGCCCGAGGGTCACCTAAGC 

2221 CGGGCAACAGACGCCCAGGACCGCGCTTCCCACGTGGCGGAGGGACTGGGGACCCGGGCA 
GCCCGTTGTCTGCGGGTCCTGGCGCGAAGGGTGCACCGCCTCCCTGACCCCTGGGCCCGT 

Sp1



E2F 

2281 CCGGTCCTGCCCCTTCACCTTCCAGCTCCGCCTCGTCCGCGCGGAACCCCGCCCCGTCCC 
GGCCAGGACGGGGAAGTGGAAGGTCGAGGCGGAGCAGGCGCGCCTTGGGGCGGGGCAGGG 

2341 GAACCCTTCCCGGGTCCCCGGCCCAGCCCCTTCCGGGCCATCCCAGCCCGTCCCGTTCCT 
CTTGGGAAGGGCCCAGGGGCCGGGTCGGGGAAGGCCCGGTAGGGTCGGGCAGGGCAAGGA 

Sp1



E2F NFkB 
★★★****** ********* ******************** 

24 01 TTTCCGCGGCCCCGCCCTCTCCTCGCGGCGCGAGTTTCAGGCAGCGCTGCGTCCTGCTGC 
AAAGGCGCCGGGGCGGGAGAGGAGCGCCGCGCTCAAAGTCCGTCGCGACGCAGGACGACG 

hTRT 5'

*****************************> 

2461 GCACGTGGGAAGCCCTGGCCCCGGCCACCCCCGCGATGCCGCGCGCTCCCCGCTGCCGAG 
CGTGCACCCTTCGGGACCGGGGCCGGTGGGGGCGCTACGGCGCGCGAGGGGCGACGGCTC 

2521 CCGTGCGCTCCCTGCTGCGCAGCCACTACCGCGAGGTGCTGCCGCTGGCCACGTTCGTGC 
GGCACGCGAGGGACGACGCGTCGGTGATGGCGCTCCACGACGGCGACCGGTGCAAGCACG 
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E2F 
**** ** * 

2581 GGCGCCTGGGGCCCCAGGGCTGGCGGCTGGTGCAGCGCGGGGACCCGGCGGCTTTCCGCG 
CCGCGGACCCCGGGGTCCCGACCGCCGACCACGTCGCGCCCCTGGGCCGCCGAAAGGCGC 



★ 

2641 CGCTGGTGGCCCAGTGCCTGGTGTGCGTGCCCTGGGACGCACGGCCGCCCCCCGCCGCCC 
GCGACCACCGGGTCACGGACCACACGCACGGGACCCTGCGTGCCGGCGGGGGGCGGCGGG 

NFkB 



********************************************** 

2701 CCTCCTTCCGCCAGGTGGGCCTCCCCGGGGTCGGCGTCCGGCTGGGGTTGAGGGCGGCCG 
GGAGGAAGGCGGTCCACCCGGAGGGGCCCCAGCCGCAGGCCGACCCCAACTCCCGCCGGC 

Topo_II_cleavag 



NFkB 
++++++++++ 
NFkB 



Intron1

****************************^ 

2761 GGGGGAACCAGCGACATGCGGAGAGCAGCGCAGGCGACTCAGGGCGCTTCCCCCGCAGGT 
CCCCCTTGGTCGCTGTACGCCTCTCGTCGCGTCCGCTGAGTCCCGCGAAGGGGGCGTCCA 

e site 



2821 GTCCTGCCTGAAGGAGCTGGTGGCCCGAGTGCTGCAGAGGCTGTGCGAGCGCGGCGCGAA 
CAGGACGGACTTCCTCGACCACCGGGCTCACGACGTCTCCGACACGCTCGCGCCGCGCTT 

2881 GAACGTGCTGGCCTTCGGCTTCGCGCTGCTGGACGGGGCCCGCGGGGGCCCCCCCGAGGC 
CTTGCACGACCGGAAGCCGAAGCGCGACGACCTGCCCCGGGCGCCCCCGGGGGGGCTCCG 



2 941 CTTCACCACCAGCGTGCGCAGCTACCTGCCCAACACGGTGACCGACGCACTGCGGGGGAG 

GAAGTGGTGGTCGCACGCGTCGATGGACGGGTTGTGCCACTGGCTGCGTGACGCCCCCTC 

3 001 CGGGGCGTGGGGGCTGCTGCTGCGCCGCGTGGGCGACGACGTGCTGGTTCACCTGCTGGC 

GCCCCGCACCCCCGACGACGACGCGGCGCACCCGCTGCTGCACGACCAAGTGGACGACCG 

3 061 ACGCTGCGCGCTCTTTGTGCTGGTGGCTCCCAGCTGCGCCTACCAGGTGTGCGGGCCGCC 
TGCGACGCGCGAGAAACACGACCACCGAGGGTCGACGCGGATGGTCCACACGCCCGGCGG 

3121 GCTGTACCAGCTCGGCGCTGCCACTCAGGCCCGGCCCCCGCCACACGCTAGTGGACCCCG 
CGACATGGTCGAGCCGCGACGGTGAGTCCGGGCCGGGGGCGGTGTGCGATCACCTGGGGC 

3181 AAGGCGTCTGGGATGCGAACGGGCCTGGAACCATAGCGTCAGGGAGGCCGGGGTCCCCCT 
TTCCGCAGACCCTACGCTTGCCCGGACCTTGGTATCGCAGTCCCTCCGGCCCCAGGGGGA 

3241 GGGCCTGCCAGCCCCGGGTGCGAGGAGGCGCGGGGGCAGTGCCAGCCGAAGTCTGCCGTT 
CCCGGACGGTCGGGGCCCACGCTCCTCCGCGCCCCCGTCACGGTCGGCTTCAGACGGCAA 

33 01 GCCCAAGAGGCCCAGGCGTGGCGCTGCCCCTGAGCCGGAGCGGACGCCCGTTGGGCAGGG 
CGGGTTCTCCGGGTCCGCACCGCGACGGGGACTCGGCCTCGCCTGCGGGCAACCCGTCCC 
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3361 GTCCTGGGCCCACCCGGGCAGGACGCGTGGACCGAGTGACCGTGGTTTCTGTGTGGTGTC 
CAGGACCCGGGTGGGCCCGTCCTGCGCACCTGGCTCACTGGCACCAAAGACACACCACAG

3421 ACCTGCCAGACCCGCCGAAGAAGCCACCTCTTTGGAGGGTGCGCTCTCTGGCACGCGCCA 
TGGACGGTCTGGGCGGCTTCTTCGGTGGAGAAACCTCCCACGCGAGAGACCGTGCGCGGT 

34 81 CTCCCACCCATCCGTGGGCCGCCAGCACCACGCGGGCCCCCCATCCACATCGCGGCCACC 
GAGGGTGGGTAGGCACCCGGCGGTCGTGGTGCGCCCGGGGGGTAGGTGTAGCGCCGGTGG 

3541 ACGTCCCTGGGACACGCCTTGTCCCCCGGTGTACGCCGAGACCAAGCACTTCCTCTACTC 
TGCAGGGACCCTGTGCGGAACAGGGGGCCACATGCGGCTCTGGTTCGTGAAGGAGATGAG 

36 01 CTCAGGCGACAAGGAGCAGCTGCGGCCCTCCTTCCTACTCAGCTCTCTGAGGCCCAGCCT 
GAGTCCGCTGTTCCTCGTCGACGCCGGGAGGAAGGATGAGTCGAGAGACTCCGGGTCGGA 

3661 GACTGGCGCTCGGAGGCTCGTGGAGACCATCTTTCTGGGTTCCAGGCCCTGGATGCCAGG 
CTGACCGCGAGCCTCCGAGCACCTCTGGTAGAAAGACCCAAGGTCCGGGACCTACGGTCC 

3 721 GACTCCCCGCAGGTTGCCCCGCCTGCCCCAGCGCTACTGGCAAATGCGGCCCCTGTTTCT 
CTGAGGGGCGTCCAACGGGGCGGACGGGGTCGCGATGACCGTTTACGCCGGGGACAAAGA 

3781 GGAGCTGCTTGGGAACCACGCGCAGTGCCCCTACGGGGTGCTCCTCAAGACGCACTGCCC 
CCTCGACGAACCCTTGGTGCGCGTCACGGGGATGCCCCACGAGGAGTTCTGCGTGACGGG 

3841 GCTGCGAGCTGCGGTCACCCCAGCAGCCGGTGTCTGTGCCCGGGAGAAGCCCCAGGGCTC 
CGACGCTCGACGCCAGTGGGGTCGTCGGCCACAGACACGGGCCCTCTTCGGGGTCCCGAG 

3 901 TGTGGCGGCCCCCGAGGAGGAGGACACAGACCCCCGTCGCCTGGTGCAGCTGCTCCGCCA 
ACACCGCCGGGGGCTCCTCCTCCTGTGTCTGGGGGCAGCGGACCACGTCGACGAGGCGGT 

3 961 GCACAGCAGCCCCTGGCAGGTGTACGGCTTCGTGCGGGCCTGCCTGCGCCGGCTGGTGCC 

CGTGTCGTCGGGGACCGTCCACATGCCGAAGCACGCCCGGACGGACGCGGCCGACCACGG 

4 021 CCCAGGCCTCTGGGGCTCCAGGCACAACGAACGCCGCTTCCTCAGGAACACCAAGAAGTT 

GGGTCCGGAGACCCCGAGGTCCGTGTTGCTTGCGGCGAAGGAGTCCTTGTGGTTCTTCAA 



4 081 CATCTCCCTGGGGAAGCATGCCAAGCTCTCGCTGCAGGAGCTGACGTGGAAGATGAGCGT 
GTAGAGGGACCCCTTCGTACGGTTCGAGAGCGACGTCCTCGACTGCACCTTCTACTCGCA 



**************************** 
4141 GCGGGACTGCGCTTGGCTGCGCAGGAGCCCAGGTGAGGAGGTGGTGGCCGTCGAGGGCCC 
CGCCCTGACGCGAACCGACGCGTCCTCGGGTCCACTCCTCCACCACCGGCAGCTCCCGGG 

Intron2 

****************************^ 

4201 AGGCCCCAGAGCTGAATGCAGTAGGGGCTCAGAAAAGGGGGCAGGCAGAGCCCTGGTCCT
TCCGGGGTCTCGACTTACGTCATCCCCGAGTCTTTTCCCCCGTCCGTCTCGGGACCAGGA 



4261 CCTGTCTCCATCGTCACGTGGGCACACGTGGCTTTTCGCTCAGGACGTCGAGTGGACACG 
GGACAGAGGTAGCAGTGCACCCGTGTGCACCGAAAAGCGAGTCCTGCAGCTCACCTGTGC 



4321 GTGATCGAGGTCGAC 
CACTAGCTCCAGCTG 
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gccaagttcctgcactggctgatgagtgtgtacgtcgtcgagctgctcaggtctttcttt 
tatgtcacggagaccacgtttcaaaagaacaggctctttttctaccggaagagtgtctgg 
agcaagttgcaaagcattggaatcagacagcacttgaagagggtgcagctgcgggacgtg 
tcggaagcagaggtcaggcagcatcgggaagccaggcccgccctgctgacgtccagactc 
cgcttcatccccaagcctgacgggctgcggccgattgtgaacatggactacgtcgtggga 
gccagaacgttccgcagagaaaagagggccgagcgtctcacctcgagggtgaaggcactg 
ttcagcgtgctcaactacgagcgggcgcg 

FIG. 23



TCTACCTTGACAGACCTCCAGCCGTACATGCGACAGTTCGTGGCTCACCTGCAGGAG 
ACCAGCCCGCTGAGGGATGCCGTCGTCATCGAGCAGAGCTCCTCCCTGAATGAGGCC 
AGCAGTGGCCTCTTCGACGTCTTCCTACGCTTCATGTGCCACCACGCCGTGCGCATC 
AGGGGCAAGTC 
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Glyc. grad. 

fractions pmol RSA 
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Gradient 
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Telomerase: 
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3' TELOMERASE 



TEMPLATE 

CCAAAACCCCAAAAC ■ 
ttTT GGGG-3' 



5' 




3' TELOMERASE 



TEMPLATE 

CCAAAACCCCAAAAC 

_ gG GGTTTT-3 ' 



5' 




PANEL A 



PANEL B 
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1 CCCCAAAACC CCAAAACCCC AAAACCCCTA TAAAAAAAGA AAAAATTGAG 

51 GTAGTTTAGA AATAAAATAT TATTCCCGCA CAAATGGAGA TGGATATTGA 

101 TTTGGATGAT ATAGAAAATT TACTTCCTAA TACATTCAAC AAGTATAGCA 

151 GCTCTTGTAG TGACAAGAAA GGATGCAAAA CATTGAAATC TGGCTCGAAA 

2 01 TCGCCTTCAT TGACTATTCC AAAGTTGCAA AAACAATTAG AGTTCTACTT 

2 51 CTCGGATGCA AATCTTTATA ACGATTCTTT CTTGAGAAAA TTAGTTTTAA 

3 01 AAAGCGGAGA GCAAAGAGTA G AAAT TG AAA CATTACTAAT GTTTAAATAA 

3 51 AATCAGGTAA TGAGGATTAT TCTATTTTTT AGATCACTTC TTAAGGAGCA 

4 01 TTATGGAGAA AATTAC TTAA TACTAAAAGG TAAACAGTTT GGATTATTTC 

4 51 CCTAGCCAAC AATGATGAGT ATATTAAATT CATATGAGAA TGAGTCAAAG 

5 01 GATCTCGATA CATCAGACTT ACCAAAGACA AACTCGCTAT AAAACGCAAG 

5 51 AAAAAGTTTG ATAATCGAAC AGCAGAAGAA CTTATTGCAT TTACTATTCG 

6 01 TATGGGTTTT ATTACAATTG TTTTAGGTAT CGACGGTGAA CTCCCGAGTC 
651 TTGAGACAAT TGAAAAAGCT GTTTACAACT GAAGGAATCG CAGTTCTGAA 

7 01 AGTTCTGATG TGTATGCCAT TATTTTGTGA ATTAATCTCA AATATCTTAT 
751 CTCAATTTAA TGGATAGCTA TAGAAACAAA CCAAATAAAC CATGCAAGTT 

8 01 TAATGGAATA TACGTTAAAT CCTTTGGGAC AAATGCACAC TGAATTTATA 

8 51 TTGGATTCTT AAAGCATAGA TACACAGAAT GCTTTAGAGA CTGATTTAGC 

9 01 TTACAACAGA TTACCTGTTT TGATTACTCT TGCTCATCTC TTATATCTTT 
951 AAAAGAAGCA GGCGAAATGA AAAGAAGACT AAAGAAAGAG ATTTCAAAAT 

10 01 TTGTTGATTC TTCTGTAACC GGAATTAACA ACAAGAATAT TAGCAACGAA 

10 51 AAAGAAGAAG AGCTATCACA ATCCTGATTC TTAAAGATTT CAAAAATTCC 

1101 AGGTAAGAGA GATACATTCA TTAAAATTCA TATATTATAG TTTTTCATTT 

1151 CACAGCTGTT ATTTTCTTTT ATCTTAACAA TATTTTTTGA . TTAGCTGGAA 

12 01 GTAAAAAGTA TCAAATAAGA GAAGCGCTAG ACTGAGGTAA CTTAGCTTAT 

12 51 TC AC ATT CAT AGATCGACCT TCATATATCC AATACGATGA TAAGGAAACA 

13 01 GCAGTCATCC GTTTTAAAAA TAGTGCTATG AGGACTAAAT TTTTAGAGTC 

13 51 AAGAAATGGA GCCGAAATCT TAATCAAAAA GAATTGCGTC GATATTGCAA 

14 01 AAGAATCGAA CTCTAAATCT TTCGTTAATA AGTATTACCA ATCTTGATTG 

14 51 ATTGAAGAGA TTGACGAGGC AACTGCACAG AAGATCATTA AAGAAATAAA 

15 01 GTAACTTTTA TTAATTAGAG AATAAACTAA ATTACTAATA TAGAGATCAG 
1551 CGATCTTCAA TTGACGAAAT AAAAGCTGAA CTAAAGTTAG ACAATAAAAA 
1601 ATACAAACCT TGGTCAAAAT ATTGAGGAAG GAAAAGAAGA CCAGTTAGCA 
1651 AAAGAAAAAA TAAGGCAATA AATAAAATGA GTACAGAAGT GAAGAAATAA 
17 01 AAGATTTATT TTTTTCAATA ATTTATTGAA AAGAGGGGTT TTGGGGTTTT 
1751 GGGGTTTTGG GG 
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CCCCAAAACCCCAAAACCCCA?\AACCCCTATAAAAAAAGAAAAAATTGAGGTAGTTTAGA 

1 + + + + + + 60 

GGGGTTTTGGGGTTTTGGGGTTTTGGGGATATTTTTTTCTTTTTTAACTCCATCAAATCT 

a PQNPKTPKPL*KKKKLR*FR 

b PKTPKPQNPYKKRKNCGSLE- 

c PKPQNPKTP I KKE KI EVV* K - 

AATAAAATATTATTCCCGCACAAATGGAGATGGATATTGATTTGGATGATATAGAAAATT 
61 + + + + + + 120 

TTATTTTATAATAAGGGCGTGTTTACCTCTACCTATAACTAAACCTACTATATCTTTTAA 

a NKILFPHKWRWILIWMI*KI 

b IKYYSRTNGDGYCFGCYRKF- 

C * N I IPAQMEMDIDLDDIENL- 

TACTTCCTAATACATTCAACAAGTATAGCAGCTCTTGTAGTGACAAGAAAGGATGCAAAA 

121 + + + + + + 180 

ATGAAGGATTATGTAAGTTGTTCATATCGTCGAGAACATCACTGTTCTTTCCTACGTTTT 

a YFLIHSTSIAALVVTRKDAK 

b TS*YIQQV*QLL*CQERMQN- 

c L PNTFNKYS SS CSDKKGCKT- 

CATTGAAATCTGGCTCGAAATCGCCTTCATTGACTATTCCAAAGTTGCAAAAACAATTAG 

181 + + + + + + 240

GTAACTTTAGACCGAGCTTTAGCGGAAGTAACTGATAAGGTTTCAACGTTTTTGTTAATC 

a HCNLARNRLHCLFQSCKNN* 

b IEIWLEIAFIDYSKVAKTIR-

C LKSGSKS PSLTI PKLQKQLE- 

AGTTCTACTTCTCGGATGCAAATCTTTATAACGATTCTTTCTTGAGAAAATTAGTTTTAA 

241 + + + + + + 300 

TCAAGATGAAGAGCCTACGTTTAGAAATATTGCTAAGAAAGAACTCTTTTAATCAAAATT 

a SSTSRMQIFITILSCEN*F* 

b VLLLGCKSL*RFFLEKISFK- 

C FYFSDANLYNDS FLRKLVLK- 

AAAGCGGAGAGCAAAGAGTAGAAATTGAAACATTACTAATGTTTAAATAAAATCAGGTAA 

301 + + + + + + 360 

TTTCGCCTCTCGTTTCTCATCTTTAACTTTGTAATGATTACAAATTTATTTTAGTCCATT 

a KAESKE * KLKHY* CLNKIR* 

b KRRAKSRNCNITNV* IKSGN- 

C SGEQRVE I ETLLMFK*NQVM- 

TGAGGATTATTCTATTTTTTAGATCACTTCTTAAGGAGCATTATGGAGAAAATTACTTAA 

361 + + + + + + 420 

ACTCCTAATAAGATAAAAAATCTAGTGAAGAATTCCTCGTAATACCTCTTTTAATGAATT 

a CGLFYFLDHFLRS IMEKIT* 

b EDYSIF* ITS*GALWRKLLN- 

C RIILFFRSLLKEHYGENYLI- 
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TACTAAAAGGTAAACAGTTTGGATTATTTCCCTAGCCAACAATGATGAGTATATTAAATT 

421 + + + + + + 480 

ATGATTTTCCATTTGTCAAACCTAATAAAGGGATCGGTTGTTACTACTCATATAATTTAA 

a Y*KVNSLDYFPSQQCCVY*I 

b TKR*TVWIISLANNDEYIKF- 

C LKGKQFGLFP* PTMMS I LNS- 

CATATGAGAATGAGTCAAAGGATCTCGATACATCAGACTTACCAAAGACAAACTCGCTAT 

481 + + + + + + 540 

GTATACTCTTACTCAGTTTCCTAGAGCTATGTAGTCTGAATGGTTTCTGTTTGAGCGATA 

a HMRMSQRISIHQTYQRQTRY 

b ICECVKGSRYIRLTKDKLAI-

C Y E N E S KDLDTSDLPKTNSL*- 

AAAACGCAAGAAAAAGTTTGATAATCGAACAGCAGAAGAACTTATTGCATTTACTATTCG 
541 + + + + + + 600 

TTTTGCGTTCTTTTTCAAACTATTAGCTTGTCGTCTTCTTGAATAACGTAAATGATAAGC 

a KTQEKVC*SNSRRTYCIYYS 

b KRKKKFDNRTAEELIAFTIR- 

c NARKSLI IEQQKNLLHLLFV- 

TATGGGTTTTATTACAATTGTTTTAGGTATCGACGGTGAACTCCCGAGTCTTGAGACAAT 

601 + + + + + + 660 

ATACCCAAAATAATGTTAACAAAATCCATAGCTGCCACTTGAGGGCTCAGAACTCTGTTA 

a YGFYYNC FRYRRCT PE S CDN 

b MGF ITIVLGIDGELPSLETI 

C WVLLQLF*VSTVNSRVLRQL- 

TGAAAAAGCTGTTTACAACTGAAGGAATCGCAGTTCTGAAAGTTCTGATGTGTATGCCAT 

661 + + + + + + 720 

ACTTTTTCGACAAATGTTGACTTCCTTAGCGTCAAGACTTTCAAGACTACACATACGGTA 

a CKSCLQLKESQFCKFCCVCH 

b EKAVYNCRNRSSESSDVYAI 

C KKLFTTEGIAVLKVLMCMPL- 

TATTTTGTGAATTAATCTCAAATATCTTATCTCAATTTAATGGATAGCTATAGAAACAAA 

721 + + + + + + 780 

ATAAAACACTTAATTAGAGTTTATAGAATAGAGTTAAATTACCTATCGATATCTTTGTTT 

a YFVN* SQISYLNLMDSYRNK 

b ILCINLKYLISI*WIAIETN- 

C FCELI SNILSQFNG* L* KQT- 

CCAAATAAACCATGCAAGTTTAATGGAATATACGTTAAATCCTTTGGGACAAATGCACAC 

781 + + + + + + 840 

GGTTTATTTGGTACGTTCAAATTACCTTATATGCAATTTAGGAAACCCTGTTTACGTGTG 

a PNKPCKFNGIYVKS FGTNAH 

b Q INHASLMEYTLNPLGQMHT 

C K*TMQV*WNIR* ILWDKCTL- 

TGAATTTATATTGGATTCTTAAAGCATAGATACACAGAATGCTTTAGAGACTGATTTAGC 

841 + + + + + + 900 

ACTTAAATATAACCTAAGAATTTCGTATCTATGTGTCTTACGAAATCTCTGACTAAATCG

a CIYIGFLKHRYTECFRDCFS 

b EFILDS * SIDTQNALETDLA- 

C NLYWI LKA* IHRML* RL I * L- 



FIG. 35B 



+ 



44/103 



TTACAACAGATTACCTGTTTTGATTACTCTTGCTCATCTCTTATATCTTTAAAAGAAGCA

901 + + + + + + 960

AATGTTGTCTAATGGACAAAACTAATGAGAACGAGTAGAGAATATAGAAATTTTCTTCGT

a LQQITCFDYSCSSLISLKEA

b YNRLPVLITLAHLLYL*KKQ

c TTDYLFCLLLLISYIFKRSR-



GGCGAAATGAAAAGAAGACTAAAGAAAGAGATTTCAAAATTTGTTGATTCTTCTGTAACC 

961 + + + + + + 1020 

CCGCTTTACTTTTCTTCTGATTTCTTTCTCTAAAGTTTTAAACAACTAAGAAGACATTGG 

a GEMKRRLKKEISKFVDSSVT 

b AKCKED*RKRFQNLLILL*P- 

c RNEKKTKERDFKI CCFFCNR- 

GGAATTAACAACAAGAATATTAGCAACGAAAAAGAAGAAGAGCTATCACAATCCTGATTC 

1021 + + + + + + 1080

CCTTAATTGTTGTTCTTATAATCGTTGCTTTTTCTTCTTCTCGATAGTGTTAGGACTAAG 

a GINNKNISNEKEEELSQSCF 

b ELTTR I LATKKKKSYHNPDS 

C N*QQEY * QRKRRRAI TI L I L - 

TTAAAGATTTCAAAAATTCCAGGTAAGAGAGATACATTCATTAAAATTCATATATTATAG 

1081 + + + + + + 1140 

AATTTCTAAAGTTTTTAAGGTCCATTCTCTCTATGTAAGTAATTTTAAGTATATAATATC 

a LKISKIPGKRDTFIKIHIL* 

b *RFQKFQVREIHSLKFIYYS- 

C KDFKNSR*ERYIH*NSYI IV- 

TTTTTCATTTCACAGCTGTTATTTTCTTTTATCTTAACAATATTTTTTGATTAGCTGGAA 

1141 + + + + + + 1200 

AAAAAGTAAAGTGTCGACAATAAAAGAAAATAGAATTGTTATAAAAAACTAATCGACCTT 

a FFISQLLFSFILTIFFD*LE 

b FSFHSCYFLLS*QYFLISWK- 

C FHFTAVI FFYLNNI FCLAGS- 

GTAAAAAGTATCAAATAAGAGAAGCGCTAGACTGAGGTAACTTAGCTTATTCACATTCAT 

1201 + + + + + + 1260 

CATTTTTCATAGTTTATTCTCTTCGCGATCTGACTCCATTGAATCGAATAAGTGTAAGTA 

a VKSIK*EKR*TEVT*LIHIH 

b *KVSNKRSARLR* LSLFTFI 

c KKYQI REALDCGNLAYSHS * - 

AGATCGACCTTCATATATCCAATACGATGATAAGGAAACAGCAGTCATCCGTTTTAAAAA 

1261 + + + + + + 1320 

TCTAGCTGGAAGTATATAGGTTATGCTACTATTCCTTTGTCGTCAGTAGGCAAAATTTTT 

a RSTFIYPIRC*GNSSHPF*K 

b DRPSYIQYDDKETAVIRFKN- 

C I DLHI SNTMIRKQQS SVLKI- 

TAGTGCTATGAGGACTAAATTTTTAGAGTCAAGAAATGGAGCCGAAATCTTAATCAAAAA 

1321 + + + + + + 1380

ATCACGATACTCCTGATTTAAAAATCTCAGTTCTTTACCTCGGCTTTAGAATTAGTTTTT 

a * CYED* I FRVKKWSRNLNQK 

b SAMRTKFLE SRNGAE I L IKK- 

c VLCGLNF* SQEMEPKS* SKR- 
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GAATTGCGTCGATATTGCAAAAGAATCGAACTCTAAATCTTTCGTTAATAAGTATTACCA 

1381 + + + + + + 1440 

CTTAACGCAGCTATAACGTTTTCTTAGCTTGAGATTTAGAAAGCAATTATTCATAATGGT 

a ELRRYCKRIEL* I F R * *VLP 

b NCVDIAKESNSKSFVNKYYQ 

C IAS ILQKNRTLNLSLIS I T N - 

ATCTTGATTGATTGAAGAGATTGACGAGGCAACTGCACAGAAGATCATTAAAGAAATAAA 

1441 + + + + + + 1500 

TAGAACTAACTAACTTCTCTAACTGCTCCGTTGACGTGTCTTCTAGTAATTTCTTTATTT 

a ILIDCRDCRGNCTEDH*RNK 

b SCLIEEIDEATAQKI IKEIK - 

c LDCLKRLTRQLHRRSLKK* S - 

GTAACTTTTATTAATTAGAGAATAAACTAAATTACTAATATAGAGATCAGCGATCTTCAA 

1501 + + + + + + 1560 

CATTGAAAATAATTAATCTCTTATTTGATTTAATGATTATATCTCTAGTCGCTAGAAGTT 

a VTFIN*RIN*ITNIEISDLQ 

b *LLLIRE*TKLLI*RSAIFN- 

c NFY*LENKLNY*YRDQRSS I- 

TTGACGAAATAAAAGCTGAACTAAAGTTAGACAATAAAAAATACAAACCTTGGTCAAAAT 

1561 + + + + + + 1620 

AACTGCTTTATTTTCGACTTGATTTCAATCTGTTATTTTTTATGTTTGGAACCAGTTTTA 

a LTK*KLN*S*TIKNTNLGQN 

b CRNKSCTKVRQ*KIQTLVKI 

c DEI KAELKLDNKKYKPWSKY- 

ATTGAGGAAGGAAAAGAAGACCAGTTAGCAAAAGAAAAAATAAGGCAATAAATAAAATGA 

1621 + + + + + + 1680

TAACTCCTTCCTTTTCTTCTGGTCAATCGTTTTCTTTTTTATTCCGTTATTTATTTTACT 

a IEEGKEDQLAKEKIRQ* IKC 

b LRKEKKTS*QKKK*GNK*NE 

c CGRKRR PVSKRKNKAINKMS- 

GTACAGAAGTGAAGAAATAAAAGATTTATTTTTTTCAATAATTTATTGAAAAGAGGGGTT 

1681 + + + + + + 1740 

CATGTCTTCACTTCTTTATTTTCTAAATAAAAAAAGTTATTAAATAACTTTTCTCCCCAA 

a VQKCRNKRFI FFNNLLKRGV 

b YRSEEIKDLFFSI IYCKEGF- 

C TEVKK* KIYFFQ* FIEKRGF- 

TTGGGGTTTTGGGGTTTTGGGG 

1741 + + 1762 

AACCCCAAAACCCCAAAACCCC 

a LGFWGFG 
b WGFGVLG 
c GVLGFW 
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ILRQ VE YYF GDAMLNR DKFLREQIGKNEDGWV PLSVLVT 
CLKQVEFYF SEFNFPY3RFLRTTAEK . NDGWVPISTIAT 
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cattgaactt 
tgcaatcttc 
gtatggttcc 
acgttgtgaa 
ttacttagaa 

agagaaagga 

aaagaataaa 
atattcagat 
tgaagtaaat 
taatctaggt 
aatcttaaag 
ctttgccctt 
ctcaccccac 
atttaagtta 
aaagaacaaa 



attactaatt 
ttagaaagta 
gaaaaattgt 
agggttaaga 
taggaaggta 
cttgaggtgg 
gaactttaca 
actcaaccat 
gaagtctgtg 
tatcttgata 
caaagatgcg 
actgaatcct 
tgggattaaa 
gaatctgaag 
aaggctttaa 
cacatgaagg 
gatctcatta 
aaaaaatacc 
cccttcaatc 
aatgaactca 
taactcccat 
gatactacac 
aagatgttcc 
ggattcaagg 
gaagttgttg 
ggagaatttg 
gcaatcaaga 
tctgatgttt 
gttcgtactt 
aagtcctcat 
gttgatctcc 
aaacttggtg 
actcacgtag 
atcaatgtta 
cctaacatta 
gatgagttca 
ttcatttcag 
caaaaaatag 
ttttttgttt 
cttacatagt 
aaagattaaa 



taatcaacaa 
tcaattgaaa 
ggtgggaact 
ttgacgatcc 
gttactacta 

ctgagtctga 

tcagaactac 
tcatcgaaaa 
aatttgcata 
ggatactttc 
tcagaagcaa 
aacgtaagaa 
ctaagaagaa 
ataagtccaa 
aaccagcagt 
cacctaaaat 
agttctgcca 
ctaagaccga 
ctgaattggc 
gtgcaaaagg 
atatggccat 
actctattgt 
ctcttcaatt 
ccaagaagag 
aaaaaaccga 
ttaaagtcaa 
tagcagttaa 
ctggttctat 
gtctcgagtg 
tctacatctt 
ctggagacga 
gtggtactga 
acaatatcgt 
gaggcagttc 
aaatctttgc 
atgaaaacaa 
ccaagcaagg 
gacaaaagtg 
tattgcatag 
ttatgtatcg 
a 



gattgataaa 
aatggaaatt 
tgaattagag 
taagcaatat 
agataaagat 
tcctgagttc 
cactaactac 
gtacttcaac 
ggttctctat 
ataagatatt 
gttttctgaa 
aacaatgttc 
gagaaaagag 
gagagaaact 
tatgaagaaa 
tcctaactct 
tatttctgag 
agaggaatac 
tggaaagcgt 
caacactgct 
gttacgtaac 
gatcaacaag 
ctttagtgcc 
agaaaatatg 
tgaagagaag 
cgaaggaatt 
caagaattta 
gagtacctca 
tgcattagtc 
cagttcacct 
actccgtcct 
tttcccctat 
tattttgtct 
cattgttaac 
agttgactta 
ctacatcaag 
aggagcaaat 
agtttcttga 
ccattatgaa 
cagtctatta 



aagcagtaaa 
gaaaacaact 
atgcaagaaa 
ctcgtgaacg 
gaaagaagat 
atctgctagt 
attgtagcat 
aaagcagtac 
atttttgatg 
cgtaaggaac 
ttcaacgaat 
cgttacctct 
aatctcttaa 
ggagacataa 
atagccaaga 
accttggaat 
cctaaagaaa 
aaagcagcct 
atgaagattg 
gaggtttggg 
ttgtctaaca 
atttgtgagc 
attgaagctg 
aatcttaaag 
aaagatatgg 
ggcaagcaat 
gatgaaatca 
atgtcaggtg 
cttggtttga 
agttctcaat 
tctatgtaaa 
gagtgcattg 
gatatgatga 
agcatcaaaa 
gaaggttacg 
atattcggta 
atggtcgaag 
gattcttcta 
atttaaatta 
gcctattcaa 



taaaacccaa 
aagcacaata 
accaaaatga 
tcactgcagc 
atatcatcac 
tggcagtcta 
tttgtgttgt 
ttttgcctaa 
caactgaatt 
tcactttccg 
actaacttgg 
cagttaccaa 
ccaaacttta 
tgaacgttga 
gatagaatgc 
caaagtactt 
gagtctataa 
ttggtgattc 
aaatctctaa 
ataatttaat 
tcttaaaagc 
ccaaggccgt 
ttaatgaagc 
gtcaaatcga 
agttggagta 
acattaactc 
aaggacacac 
gagccaagaa 
tggtaaaata 
gcaataagtg 
aacttttgca 
atgaatggac 
ttgcagaagg 
agtacaagga 
gaaagtgcct 
tgagcgattc 
ttatcaaaaa 
taacaaaaat 
ttatctattt 
atgattctgc 
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MEIENNQAQQPKAEKLWWELELEMQENQNDIQVRVKIDDPKQYL 
VNVTAACLiLQEGSYYQDKDERRYI ITKALLEVAESDPEFICQLA 
VYIRNELYI RTTTNY I VAFC WHKNTQ PFIE KYFNKAVLL PNDL 
LE VCE F AQVL Y I FDATE FKNL YLDR I L SQD I RKELT FRKC LQRC 
VRSKFSEFNEYQLGKYCTESQRKKTMFRYLSVTNKQKWDQTKKK 
RKENLLTKLQAI KESEDKSKRETGDIMNVEDAIKALKPAVMKKI 
AKRQNAMKKHMKAPKI PNSTLESKYLTFKDLIKFCHISEPKERV 
YKI LGKKYPKTEEE YKAAFGDS AS APFNPELAGKRMKI E I SKTW 
ENELSAKGNTAEVWDNLISSNQLPYMAMLRNLSNILKAGVSDTT 
H S I VINKI CE PKAVENS KMF PLQFFS AI EAVNEAVTKGFKAKKR 
ENMNLKGQIEAVKEWEKTDEEKKDMELEQTEEGEFVKVNEGIG 
KQ YINS I ELAI KI AVNKNLDE I KGHTAI FSDVSGSMSTSMSGGA 
KKYGSVRTCLECALVLGLMVKQRCEKSSFYIFSSPSSQCNKCYL 
EVDLPGDELRPSMQKLLQEKGKLGGGTDFPYECIDEWTKNKTHV 
DNIVILSDMMIAEGYSDINVRGSSIVNSIKKYKDEWPNIKIFA 
VDLEGYGKCLNLGDE FNENNY I KI FGMSDS ILKFI S AKQGGANM 
VE VI KNFALQKI GQK 

FIG. 43 

MSRRNQKKPQAP I GNETNLDFVLQNLE VYKSQ I EHYKTQQQQ I K 
EEDLKLLKFKNQDQDGNSGNDDDDEENNSNKQQELLRRVNQIKQ 
QVQL I KKVGS KVE KDLNLNE DENKKNGL S EQQVKEEQLRT I TE E 
QVKYQNLVFNMDYQLDLNESGGHRRHRRETDYDTEKWFEISHDQ 
KNYVS I YANQKTS YCWWLKD YFNKNNYDHLNVS I NRLETEAE FY 
AFDDFSQTIKLTNNSYQTVNIDVNFDNNLCILALLRFLLSLERF 
NILNIRSSYTRNQYNFEKIGELLETIFAWFSHRHLQGIHLQVP 
CEAFQYLVNS S SQ I S VKDSQLQVYS FS TDLKLVDTNKVQD YFKF 
LQEFPRLTHVSQQAI PVSATNAVENLNVLLKKVKHANLNLVS I P 
TQFNFDFYFVNLQHLKLEFGLEPNILTKQKLENLLLSIKQSKNL 
KFLRLNFYTYVAQETSRKQILKQATTIKNLKNNKNQEETPETKD 
ETPSESTSGMKFFDHLSELTELEDFSVNLQATQEIYDSLHKLLI 
RSTNLKKFKLSYKYEMEKS KMDTFIDLKNIYETLNNLKRCSVNI 
SNPHGNISYELTNKDSTFYKFKLTLNQELQHAKYTFKQNEFQFN 
NVKSAKIESSSLESLEDIDSLCKSIASCKNLQNVNI IASLLYPN 
NIQKNPFNKPNLLFFKQFEQLKNLENVSINCILDQHILNSISEF 
LEKNKKIKAFILKRYYLLQYYLDYTKLFKTLQQLPELNQVYINQ 
QLEELTVSEVHKQVWENHKQKAFYE PLCEF I KESSQTLQL I DFD 
QNTVSDDSIKKILESISESKYHHYLRLNPSQSSSLIKSENEEIQ 
ELLKACDEKGVLVKAYYKFPLCLPTGTYYDYNSDRW 

FIG. 45 

MKILFEFIQDKLDIDLQTNSTYKENLKCGHFNGLDEILTTCFAL 
PNSRKIALPCLPGDLSHKAVIDHCII YLLTGELYNNVLTFGYKI 
ARNE D VNNS L F CH S ANVNVTL L KG AAW KM FH S L VGT Y AF VDL L I 
NYTVIQFNGQFFTQIVGNRCNEPHLPPKWVQRSSSSSATAAQIK 
QLTEPVTNKQFLHKLNINSSSFFPYSKILPSSSSIKKLTDLREA 
I FPTNLVKI PQRLKVRINLTLQKLLKRHKRLNYVS ILNS ICPPL 
EGTVLDLSHLSRQSPKERVLKFIIVILQKLLPQEMFGSKKNKGK 
IIPCNLNLLLSLPLNGYLPFDSLLKKLRLKDFRWLFISDIWFTKH 
NFENLNQLAICFISWLFRQLIPKIIQTFFYCTEISSTVTIVYFR 
HDTWNKL ITPF I VE YFKTYLVENNVCRNHNS YTLSNFNHSKMR I 
IPKKSNNEFRI IAIPCRGADEEEFTI YKENHKNAIQPTQKILEY 
LRNKRPTSFTKIYSPTQIADRIKEFKQRLLKKFNNVLPELYFMK
FDVKSCYDSIPRMECMRILKDALKNENGFFVRSQYFFNTNTGVL 
KLFNWNASRVPKPYELYIDNVRTVHLSNQDVINWEMEIFKTA 
LWVEDKCYIREDGLFQGSSLSAPIVDLVYDDLLEFYSEFKASPS 
QD TL I L KLAD DFLIISTDQQQVINI KKLAMGG FQ K YNAKANRD K 
ILAVSSQSDDDTVIQFCAMHIFVKELEVWKHSSTMNNFHIRSKS 
SKGIFRSLIALFNTRIS YKT I DTNLNS TNTVLMQ I DHWKN I S E 
CYKSAFKDLSINVTQNMQFHSFLQRI IEMTVSGCPITKCDPLIE 
YEVRFTI LNGFLESLSSNTSKFKDNI ILLRKEIQHLQAYI YI YI 
HIVN 
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1 tcaatactat taattaataa ataaaaaaaa 
61 ctaaaaaaag ccataggctc ctataggcaa 
121 tctagaagtt tacaaaagcc agattgagca 
181 ggaggatctc aagcttttaa agttcaaaaa 
241 tgatgatgat gaagaaaaca actcaaataa 
3 01 gattaagtag caagtttaat tgataaaaaa 

3 61 tttgaacgaa gatgaaaaca aaaagaatgg 
421 attaagaacg attactgaag aataggttaa 

4 81 ccagttagat ttaaatgaga gtggtggcca 
541 tactgaaaaa tggtttgaaa tatctcatga 
601 ctaaaagaca tcatattgtt ggtggcttaa 
661 tcttaatgta agcattaaca gactagaaac 
721 ttcacaaaca atcaaactta ctaataattc 
781 tgataataat ctctgtatac tcgcattgct 
841 tattttgaat ataagatctt cttatacaag 
901 gctacttgaa actatcttcg cagttgtctt 
961 acaagttcct tgcgaagcgt tctaatattt 

1021 agatagctaa ttataggtat actctttctc 
1081 agtccaagat tattttaagt tcttataaga 
1141 ggctatccca gttagtgcta ctaacgctgt 
1201 caagcatgct aatcttaatt tagtttctat 
1261 tgttaattta taacatttga aattagagtt 
1321 aaagcttgaa aatctacttt tgagtataaa 
13 81 aaacttttac acctacgttg cttaagaaac 
1441 aacaatcaaa aatctcaaaa acaataaaaa 
1501 aactccaagc gaaagcacaa gtggtatgaa 
1561 gcttgaagat ttcagcgtta acttgtaagc 
1621 acttttgatt agatcaacaa atttaaagaa 
1681 aaagagtaaa atggatacat tcatagatct 
1741 taaaagatgc tctgttaata tatcaaatcc 
1801 taaagattct actttttata aatttaagct 
1861 gtatactttt aagtagaacg aattttaatt 
1921 ttcctcatta gaaagcttag aagatattga 
1981 aaatttacaa aatgttaata ttatcgccag 
2041 tcctttcaat aagcccaatc ttctattttt 
2101 aaatgtatct atcaactgta ttcttgatca 
2161 agaaaagaat aaaaaaataa aagcattcat 
2221 tcttgattat actaaattat ttaaaacact 
2281 cattaattag caattagaag aattgactgt 
2341 ccacaagcaa aaagctttct atgaaccatt 
2401 cctttagcta atagattttg accaaaacac 
2461 agaatctata tctgagtcta agtatcatca 
2521 cagtttaatt aaatctgaaa acgaagaaat 
2581 aggtgtttta gtaaaagcat actataaatt 
2641 cgattacaat tcagatagat ggtgattaat 
2701 tgaatatttc tttgcttatt atttgaataa 
2761 atatatttta gttatttaat tcattatttt 
2821 aaaaaatcg 



gcaaactaca aagaaaatgt caaggcgtaa 
tgaaacaaat cttgattttg tattacaaaa 
ttataagacc tagtagtaat agatcaaaga 
ttaagattag gatggaaact ctggcaacga 
ataataagaa ttattaagga gagtcaatta 
agttggttct aaggtagaga aagatttgaa 
actttctgaa tagcaagtga aagaagagta 
gtattaaaat ttagtattta acatggacta 
tagaagacac agaagagaaa cagattatga 
ccaaaaaaat tatgtatcaa tttacgccaa 
agattatttt aataaaaaca attatgatca 
tgaagccgaa ttctatgcct ttgatgattt 
ttactagact gttaacatag acgttaattt 
tagattttta ttatcactag aaagattcaa 
aaattaatat aattttgaga aaattggtga 
ttctcatcgc cacttacaag gcattcattt 
agttaactcc tcatcataaa ttagcgttaa 
tacagactta aaattagttg acactaacaa 
attccctcgt ttgactcatg taagctagta 
agagaacctc aatgttttac ttaaaaaggt 
ccctacctaa ttcaattttg atttctactt 
tggattagaa ccaaatattt tgacaaaaca 
ataatcaaaa aatcttaaat ttttaagatt 
ctccagaaaa cagatattaa aacaagctac 
tcaagaagaa actcctgaaa ctaaagatga 
attttttgat catctttctg aattaaccga 
tacccaagaa atttatgata gcttgcacaa 
gttcaaatta agttacaaat atgaaatgga 
taagaatatt tatgaaacct taaacaatct 
tcatggaaac atttcttatg aactgacaaa 
gaccttaaac taagaattat aacacgctaa 
taataacgtt aaaagtgcaa aaattgaatc 
tagtctttgc aaatctattg cttcttgtaa 
tttgctctat cccaacaata tttagaaaaa 
caagcaattt gaataattga aaaatttgga 
gcatatactt aattctattt cagaattctt 
tttgaaaaga tattatttat tacaatatta 
tcaatagtta cctgaattaa attaagttta 
gagtgaagta cataagtaag tatgggaaaa 
atgtgagttt atcaaagaat catcctaaac 
tgtaagtgat gactctatta aaaagatttt 
ttatttgaga ttgaacccta gttaatctag 
ttaagaactt ctcaaagctt gcgacgaaaa 
ccctctatgt ttaccaactg gtacttatta 
taaatattag tttaaataaa tattaaatat 
tacatacaat agtcattttt agtgttttga 
aagtaaataa ttatttttca atcatttttt 
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Oxytricha 
Euplotes 



LCVSYILSSFYYANLEENALQFLRKESMDPEKPETNLLMRLT 
LCVSSILSSFYYATLEESSLGFLRDESMNPENPNVNLLMRLT 



FIG. 47 



ATTTATACTCATGAAAATCTTATTCGAGTTCATTCAAGACAAGCTTGACATTGATCTACA 
GACCAACAGTACTTACAAAGAAAATTTAAAATGTGGTCACTTCAATGGCCTCGATGAAAT 
TCTAACTACGTGTTTCGCACTACCAAATTCAAGAAAAATAGCATTACCATGCCTTCCTGG 
TGACTTAAGCCACAAAGCAGTCATTGATCACTGCATCATTTACCTGTTGACGGGCGAATT 
ATACAACAACGTACTAACATTTGGCTATAAAATAGCTAGAAATGAAGATGTCAACAATAG 
TCTTTTTTGCCATTCTGCAAATGTTAACGTTACGTTACTGAAAGGCGCTGCTTGGAAAAT 
GTTCCACAGTTTGGTCGGTACATACGCATTCGTTGATTTATTGATCAATTATACAGTAAT 
TCAATTTAATGGGCAGTTTTTCACTCAAATCGTGGGTAACAGATGTAACGAACCTCATCT 
GCCGCCCAAATGGGTCCAACGATCATCCTCATCATCCGCAACTGCTGCGCAAATCAAACA 
ACTTACAGAACCAGTGACAAATAAACAATTCTTACACAAGCTCAATATAAATTCCTCTTC 
TTTTTTTCCTTATAGCAAGATCCTTCCTTCATCATCATCTATCAAAAAGCTAACTGACTT 
GAGAGAAGCTATTTTTCCCACAAATTTGGTTAAAATTCCTCAGAGACTAAAGGTACGAAT 
TAATTTGACGCTGCAAAAGCTATTAAAGAGACATAAGCGTTTGAATTACGTTTCTATTTT 
GAATAGTATTTGCCCACCATTGGAAGGGACCGTATTGGACTTGTCGCATTTGAGTAGGCA 
ATCACCAAAGGAACGAGTCTTGAAATTTATCATTGTTATTTTACAGAAGTTATTACCCCA 
AGAAATGTTTGGCTCAAAGAAAAATAAAGGAAAAATTATCAAGAATCTAAATCTTTTATT 
AAGTTTACCCTTAAATGGCTATTTACCATTTGATAGTTTGTTGAAAAAGTTAAGATTAAA 
GGATTTTCGGTGGTTGTTCATTTCTGATATTTGGTTCACCAAGCACAATTTTGAAAACTT 
GAATCAATTGGCGATTTGTTTCATTTCCTGGCTATTTAGACAACTAATTCCCAAAATTAT 
ACAGACTTTTTTTTACTGCACCGAAATATCTTCTACAGTGACAATTGTTTACTTTAGACA 
TGATACTTGGAATAAACTTATCACCCCTTTTATCGTAGAATATTTTAAGACGTACTTAGT 
CGAAAACAACGTATGTAGAAACCATAATAGTTACACGTTGTCCAATTTCAATCATAGCAA 
AATGAGGATTATACCAAAAAAAAGTAATAATGAGTTCAGGATTATTGCCATCCCATGCAG 
AGGGGCAGACGAAGAAGAATTCACAATTTATAAGGAGAATCACAAAAATGCTATCCAGCC
CACTCAAAAAATTTTAGAATACCTAAGAAACAAAAGGCCGACTAGTTTTACTAAAATATA
TTCTCCAACGCAAATAGCTGACCGTATCAAAGAATTTAAGCAGAGACTTTTAAAGAAATT 
TAATAATGTCTTACCAGAGCTTTATTTCATGAAATTTGATGTCAAATCTTGCTATGATTC 
CATACCAAGGATGGAATGTATGAGGATACTCAAGGATGCGCTAAAAAATGAAAATGGGTT 
TTTCGTTAGATCTCAATATTTCTTCAATACCAATACAGGTGTATTGAAGTTATTTAATGT 
TGTTAACGCTAGCAGAGTACCAAAACCTTATGAGCTATACATAGATAATGTGAGGACGGT 
TCATTTATCAAATCAGGATGTTATAAACGTTGTAGAGATGGAAATATTTAAAACAGCTTT 
GTGGGTTGAAGATAAGTGCTACATTAGAGAAGATGGTCTTTTTCAGGGCTCTAGTTTATC 
TGCTCCGATCGTTGATTTGGTGTATGACGATCTTCTGGAGTTTTATAGCGAGTTTAAAGC 
CAGTCCTAGCCAGGACACATTAATTTTAAAACTGGCTGACGATTTCCTTATAATATCAAC 
AGACCAACAGCAAGTGATCAATATCAAAAAGCTTGCCATGGGCGGATTTCAAAAATATAA 
TGCGAAAGCCAATAGAGACAAAATTTTAGCCGTAAGCTCCCAATCAGATGATGATACGGT 
TATTCAATTTTGTGCAATGCACATATTTGTTAAAGAATTGGAAGTTTGGAAACATTCAAG 
CACAATGAATAATTTCCATATCCGTTCGAAATCTAGTAAAGGGATATTTCGAAGTTTAAT 
AGCGCTGTTTAACACTAGAATCTCTTATAAAACAATTGACACAAATTTAAATTCAACAAA 
CACCGTTCTCATGCAAATTGATCATGTTGTAAAGAACATTTCGGAATGTTATAAATCTGC 
TTTTAAGGATCTATCAATTAATGTTACGCAAAATATGCAATTTCATTCGTTCTTACAACG 
CATCATTGAAATGACAGTCAGCGGTTGTCCAATTACGAAATGTGATCCTTTAATCGAGTA 
TGAGGTACGATTCACCATATTGAATGGATTTTTGGAAAGCCTATCTTCAAACACATCAAA 
ATTTAAAGATAATATCATTCTTTTGAGAAAGGAAATTCAACACTTGCAAGC 
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AKFLHWLMSVYWELLRSFFYVTETTFQKNRLFFYRKSVWSKLQSIGIRQHLKR 
VQLRDVSEAEVRQHREARPALLTSRLRFIPKPDGLRPIWMDYVVGARTFRREK 
RAERLTSRVKALFSVLNYERA 



FIG. 49 



GCCAAGTTCCTGCACTGGCTGATGAGTGTGTACGTCGTCGAGCTGCTCAGGTC 
TTTCTTTTATGTCACGGAGACCACGTTTCAAAAGAACAGGCTCTTTTTCTACC 
GGAAGAGTGTCTGGAGCAAGTTGCAAAGCATTGGAATCAGACAGCACTTGAAG 
AGGGTGCAGCTGCGGGACGTGTCGGAAGCAGAGGTCAGGCAGCATCGGGAAGC 
CAGGCCCGCCCTGCTGACGTCCAGACTCCGCTTCATCCCCAAGCCTGACGGGC 
TGCGGCCGATTGTGAACATGGACTACGTCGTGGGAGCCAGAACGTTCCGCAGA 
GAAAAGAGGGCCGAGCGTCTCACCTCGAGGGTGAAGGCACTGTTCAGCGTGCT 
CAACTACGAGCGGGCGCG 



MTEHHTPKSRILRFLENQYVYLCTLMDYVQLVLRGSPASSYSNICERLRSDVQTSFSIFLHSTWGF 
DSKPDEGVQFSSPKCSQSELIANWKQMFDESFERRRNLLMKGFSMNHEDFRAMHVNGVQNDLVSTF 
PNYLIS ILESKNWQLLLEI IGSDAMHYLLSKGSIFEALPNDNYLQISGIPLFKNNVFEETVSKKRKR 
TI ETS I TQNKS ARKEVS WNS I S I SRFS I FYRSS YKKFKQDL YFNLHS I CDRNTVHMWLQWI FPRQFG 
LINAFQVKQLHKVIPLVSQSTWPKRLLKVYPLIEQTAKRLHRISLSKVYNHYCPYIDTHDDEKILS 
YSLKPNQVFAFLRSILVRVFPKLIWGNQRIFEIILKDLETFLKLSRYESFSLHYLMSNIKISEIEWL 
VLGKRSNAKMCLSDFEKRKQIFAEFIYWLYNSFIIPILQSFFYITESSDLRNRTVYFRKDIWKLLCR 
PFITSMKMEAFEKINENNVRMDTQKTTLPPAVIRLLPKKNTFRLITNLRKRFLIKMGSNKKMLVSTN 
QTLRPVASILKHLINEESSGIPFNLEVYMKLLTFKKDLLKHRMFGRKKYFVRIDIKSCYDRIKQDLM
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Wild Type Telomerase Gene 



Wild Type Telomerase Gene 



1. Transform with linear fragment
containing the telomerase gene
disrupted with a LEU2 or ura4 marker



M 



Telomerase Gene::M 



Wild Type Telomerase Gene 




Wild Type Telomerase Gene 



2. Assay in selective media 



3. Sporulate, and grow on 
selective media 



Telomerase Gene::M 



Wild Type (X2) 



Senescence? (X2) 



(These cells will show a senescence phenotype 

if the disrupted gene encodes a telomerase subunit) 



FIG. 65 
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heterozygote diploid - 
wt diploid - 
wt haploid- 



Tetrad 



tezIA 




Generations 
after sporulation 



Telomeric 
Apa I 
fragment 




600 bp 
500 bp 
400 bp 

300 bp 
200 bp 

100 bp 



FIG. 67 
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i 

met ser val tyr val val glu leu leu 
GCCAAGTTCCTGCACTGGCTG ATG AGT GTG TAC GTC GTC GAG CTG CTC 

10 20 
arg ser phe phe tyr val thr glu thr thr phe gln lys asn arg
AGG TCT TTC TTT TAT GTC ACG GAG ACC ACG TTT CAA AAG AAC AGG 

30 

leu phe phe tyr arg lys ser val trp ser lys leu gln ser ile
CTC TTT TTC TAC CGG AAG AGT GTC TGG AGC AAG TTG CAA AGC ATT 

40 50 
gly ile arg gln his leu lys arg val gln leu arg glu leu ser
GGA ATC AGA CAG CAC TTG AAG AGG GTG CAG CTG CGG GAG CTG TCG 

60 

glu ala glu val arg gln his arg glu ala arg pro ala leu leu
GAA GCA GAG GTC AGG CAG CAT CGG GAA GCC AGG CCC GCC CTG CTG 

70 80 
thr ser arg leu arg phe ile pro lys pro asp gly leu arg pro 
ACG TCC AGA CTC CGC TTC ATC CCC AAG CCT GAC GGG CTG CGG CCG 

90 

ile val asn met asp tyr val val gly ala arg thr phe arg arg 
ATT GTG AAC ATG GAC TAC GTC GTG GGA GCC AGA ACG TTC CGC AGA 

100 110 

glu lys ala glu arg leu thr ser arg val lys ala leu phe 

GAA AAG ARG GCC GAG CGT CTC ACC TCG AGG GTG AAG GCA CTG TTC 

120 

ser val leu asn tyr glu arg ala arg arg pro gly leu leu gly 
AGC GTG CTC AAC TAC GAG CGG GCG CGG CGC CCC GGC CTC CTG GGC 

130 140 

ala ser val leu gly leu asp asp ile his arg ala trp arg thr 
GCC TCT GTG CTG GGC CTG GAC GAT ATC CAC AGG GCC TGG CGC ACC 

150 

phe val leu arg val arg ala gln asp pro pro pro glu leu tyr
TTC GTG CTG CGT GTG CGG GCC CAG GAC CCG CCG CCT GAG CTG TAC 

160 170 

phe val lys val asp val thr gly ala tyr asp thr ile pro gln
TTT GTC AAG GTG GAT GTG ACG GGC GCG TAC GAC ACC ATC CCC CAG 

180 

asp arg leu thr glu val ile ala ser ile ile lys pro gln asn
GAC AGG CTC ACG GAG GTC ATC GCC AGC ATC ATC AAA CCC CAG AAC 

190 200 

thr tyr cys val arg arg tyr ala val val gln lys ala ala met
ACG TAC TGC GTG CGT CGG TAT GCC GTG GTC CAG AAG GCC GCC ATG 



FIG. 68A 
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gly thr ser 
GGC ACG TCC 

220 

gin gly ile 
GAG GGG ATC 



leu cys tyr 
CTG TGC TAC 

250 

arg asp gly 
CGG GAC GGG 



thr pro his 
ACA CCT CAC 

280 

arg gly val 
CGA GGT GTC 



val val asn 
GTG GTG AAC 

310 

phe val gin 
TTT GTT CAG 



leu leu asp 
CTG CTG GAT 

340 

tyr ala arg 
TAT GCC CGG 



phe lys ala 
TTC AAG GCT 

370 

arg leu lys 
CGG CTG AAG 



leu gin thr 
CTC CAG ACG 

400 

ala tyr arg 
GCG TAC AGG 



210 
ala arg pro 
GCA AGG CCT 



pro gin gly 
CCG CAG GGC 

240 

gly asp met 
GGC GAC ATG 



leu leu leu 
CTG CTC CTG 

270 

leu thr his 
CTC ACC CAC 



pro glu tyr 
CCT GAG TAT 

300 

phe pro val 
TTC CCT GTA 



met pro ala 
ATG CCG GCC 

330 

thr arg thr 
ACC CGG ACC 



thr ser ile 
ACC TCC ATC 

360 

gly arg asn 
GGG AGG AAC 



cys his ser 
TGT CAC AGC 

390 

val cys thr 
GTG TGC ACC 



phe his ala 
TTT CAC GCA 



ser arg ala 
TCA AGA GCC 



ser ile leu 
TCC ATC CTC 



glu asn lys 
GAG AAC AAG 



arg leu val 
CGT TTG GTG 



ala lys thr 
GCG AAA ACC 



gly cys val 
GGC TGC GTG 



glu asp glu 
GAA GAC GAG 



his gly leu 
CAC GGC CTA 



leu glu val 
CTG GAG GTG 



arg ala ser 
AGA GCC AGT 



met arg arg 
ATG CGT CGC 



leu phe leu 
CTG TTT CTG 



asn ile tyr 
AAC ATC TAC 



cys val leu 
TGT GTG CTG 



thr ser tyr 
ACG TCC TAC 

230 
ser thr leu 
TCC ACG CTG 



leu phe ala 
CTG TTT GCG 

260 
asp asp phe 
GAT GAT TTC 



phe leu arg 
TTC CTC AGG 

290 
val asn leu 
GTG AAC TTG 



ala leu gly 
GCC CTG GGT 

320 
phe pro trp 
TTC CCC TGG 



gin ser asp 
CAG AGC GAC 

350 
leu thr phe 
CTC ACC TTC 



lys leu phe 
AAA CTC TTT 

380 
asp leu gin 
GAT TTG CAG 



lys ile leu 
AAG ATC CTC 

410 
gin leu pro 
CAG CTC CCA 



val gin cys 
GTC CAG TGC 



leu cys ser 
CTC TGC AGC 



gly ile arg 
GGG ATT CGG 



leu leu val 
TTG TTG GTG 



thr leu val 
ACC CTG GTC 



arg lys thr 
CGG AAG ACA 



gly thr ala 
GGC ACG GCT 



cys gly leu 
TGC GGC CTG 



tyr ser ser 
TAC TCC AGC 



asn arg gly 
AAC CGC GGC 



gly val leu 
GGG GTC TTG 



val asn ser 
GTG AAC AGC 



leu leu gin 
CTG CTG CAG 



phe his gin 
TTT CAT CAG 



FIG. 68B



83/103 



420 

gln val trp lys asn pro his phe ser cys ala ser ser leu thr
CAA GTT TGG AAG AAC CCA CAT TTT TCC TGC GCG TCA TCT CTG ACA 

430 440 

arg leu pro leu leu leu his pro glu ser gln glu arg arg asp
CGG CTC CCT CTG CTA CTC CAT CCT GAA AGC CAA GAA CGC AGG GAT 

450 

val ala gly gly gln gly arg arg arg pro ser ala leu arg gly
GTC GCT GGG GGC CAA GGG CGC CGC CGG CCC TCT GCC CTC CGA GGC 

460 470 

arg ala val ala val pro pro ser ile pro ala gln ala asp ser
CGT GCA GTG GCT GTG CCA CCA AGC ATT CCT GCT CAA GCT GAC TCG 

480 

thr pro cys his leu arg ala thr pro gly val thr gln asp ser
ACA CCG TGT CAC CTA CGT GCC ACT CCT GGG GTC ACT CAG GAC AGC 

490 500 

pro asp ala ala glu ser glu ala pro gly asp asp ala asp cys 
CCA GAC GCA GCT GAG TCG GAA GCT CCC GGG GAC GAC GCT GAC TGC 

510 

pro gly gly arg ser gln pro gly thr ala leu arg leu gln asp
CCT GGA GGC CGC AGC CAA CCC GGC ACT GCC CTC AGA CTT CAA GAC 

520 530 

his pro gly leu met ala thr arg pro gln pro gly arg glu gln
CAT CCT GGA CTG ATG GCC ACC CGC CCA CAG CCA GGC CGA GAG CAG 

540 

thr pro ala ala leu ser arg arg ala tyr thr ser gln gly gly
ACA CCA GCA GCC CTG TCA CGC CGG GCT TAT ACG TCC CAG GGA GGG 

550 560 

arg gly gly pro his pro gly leu his arg trp glu ser glu ala 
AGG GGC GGC CCA CAC CCA GGC CTG CAC CGC TGG GAG TCT GAG GCC 

564 
OP 

TGA GTGAGTGTTTGGCCGAGGCCTGCATGTCCGGCTGAAGGCTGAGTGTCCGGCTGAGGC 

CTGAGCGAGTGTCCAGCCAAGGGCTGAGTGTCCAGCACACCTGCGTTTTCACTTCCCCAC 

AGGCTGGCGTTCGGTCCACCCCAGGGCCAGCTTTTCCTCACCAGGAGCCCGGCTTCCACT 

CCCCACATAGGAATAGTCCATCCCCAGATTCGCCATTGTTCACCCTTCGCCCTGCCTTCC 

TTTGCCTTCCACCCCCACCATTCAGGTGGAGACCCTGAGAAGGACCCTGGGAGCTTTGGG 

AATTTGGAGTGACCAAAGGTGTGCCCTGTACACAGGCGAGGACCCTGCACCTGGATGGGG 

GTCCCTGTGGGTCAAATTGGGGGGAGGTGCTGTGGGAGTAAAATACTGAATATATGAGTT 

TTT CAGTTTTGGAAAAAAAAAAAAAAAAAAAAAAAAAA 
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Motif -1 
Ep p123
Sp Tez1
Sc Est2 
Hs TCP1 
consensus 



. LWSLIRCFFYVTEQQKSYSKT . . . 
. FIIPILQSFFYITESSDLRNRT . . . 
. LIPKIIQTFFYCTEISSTVTIV. . . 
. YWELLRSFFYVTETTFQKNRL. . . 
FFY TE 



Motif 0 
Ep p123
Sp Tez1
Sc Est2 
Hs TCP1 
consensus 



K 

p hhh K hR h R 

. KSLGFAPGKLRLI PKKT - - TFRPIMTFNKKI V 
. QKTTLPPAVIRLLPKKN- -TFRLITNLRKRFL 
. TLSNFNHSKMRI I PKKSNNEFRI IAI PCRGAD 
. ARPALLTSRLRFI PKPD - - GLRP I VNMDYWG 
R PK R I 



Motif A 
Ep p123
Sp Tez1
Sc Est2 
Hs TCP1 
consensus 



AF 

h tiDh GY h 
. PKLFFATMDIEKCYDSVNREKLSTFLK . 
. RKKYFVRIDIKSCYDRIKQDLMFRI VK . 
, PELYFMKFDVKSCYDSIPRMECMRILK. 
> PELYFVKVDVTGAYDTI PQDRLTEVIA . 

F D YD 



.// 



Motif B 
Ep pl23 
Sp Tezl 
Sc Est2 
Hs TCP1 
consensus 



hPQG pS hh 
. NGKF YKQTKGI PQGLCVS SILSS F Y YA . 
. GNSQYLQKVGIPQGSILSSFLCHFYME . 
. EDKC Y I REDGLFQGS S LSAP I VDLVYD . 
. RATSYVQCQGIPQGSILSTLLCSLCYG . 
G QG S 



Motif C 
Ep pl23 
Sp Tezl 
Sc Est2 
Hs TCP1 
consensus 



h F DD hhh 
. PNVNLLMRLTDD YLL I TTQENN . 
. KKGSVLLRWDDFLFITWKKD . 
. SQDTLILKLADDFLI ISTDQQQ . 
. RRDGLLLRLVDDFLLVTPHLTH , 
DD L 



Motif D 
Ep pl23 
Sp Tezl 
Sc Est2 
Hs TCP1 
consensus 



Gh h cK 
. NVS RENGFKFNMKKL . 
. LNLSLRGFEKHNFST . 
. KKLAMGGFQKYNAKA . 
. LRTLVRGVPEYGCW . 

G 



F/G. 69 
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1 GCAGCGCTGC GTCCTGCTGC GCACGTGGGA AGCCCTGGCC CCGGCCACCC 

51 CCGCGATGCC GCGCGCTCCC CGCTGCCGAG CCGTGCGCTC CCTGCTGCGC 

101 AGCCACTACC GCGAGGTGCT GCCGCTGGCC ACGTTCGTGC GGCGCCTGGG 

151 GCCCCAGGGC TGGCGGCTGG TGCAGCGCGG GGACCCGGCG GCTTTCCGCG 

2 01 CGNTGGTGGC CCANTGCNTG GTGTGCGTGC CCTGGGANGN ANGGCNGCCC 
251 CCCGCCGCCC CCTCCTTCCG CCAGGTGTCC TGCCTGAANG ANCTGGTGGC 

3 01 CCGAGTGCTG CANANGCTGT GCGAJSTCGCGG CGCGAANAAC GTGCTGGCCT 
3 51 TCGGCTTCGC GCTGCTGGAC GGGGCCCGCG GGGGCCCCCC CGAGGCCTTC 
401 ACCACCAGCG TGCGCAGCTA CCTGCCCAAC ACGGTGACCG ACGCACTGCG 
451 GGGGAGCGGG GCGTGGGGGC TGCTGCTGCG CCGCGTGGGC GACGACGTGC 
501 TGGTTCACCT GCTGGCACGC TGCGCGNTNT TTGTGCTGGT GGNTCCCAGC 
551 TGCGCCTACC ANGTGTGCGG GCCGCCGCTG TACCAGCTCG GCGCTGCNAC 
6 01 TCAGGCCCGG CCCCCGCCAC ACGCTANTGG ACCCGAANGC GTCTGGGATC 
651 CAACGGGCCT GGAAC CAT AG CGTCAGGGAG GCCGGGGTCC CCCTGGGCTG 
701 CCAGCCCCGG GTGCGAGGAG GCGCGGGGGC AGTGCCAGCC GAAGTCTGCC 
751 GTTGCCCAAG AGGCCCAGGC GTGGCGCTGC CCCTGAGCCG GAGCGGACGC 
8 01 CCGTTGGGCA GGGGTCCTGG GCCCACCCGG GCAGGACGCC TGGACCGAGT 
851 GACCGTGGTT TCTGTGTGGT GTCACCTGCC AGACCCGCCG AAGAAG C C AC 
901 CTCTTTGGAG GGTGCGCTCT CTGGCACGCG CCACTCCCAC CCATCCGTGG 
951 GCCGCCAGCA CCACGCGGGC CCCCCATCCA CATCGCGGCC ACCACGTCCT 

1001 GGGACACGCC TTGTCCCCCG GTGTACGCCG AGACCAAGCA CTTCCTCTAC 

1051 TCCTCAGGCG ACAAGNACAC TGCGNCCCTC CTTCCTACTC AATATATCTG 

1101 AGGCCCAGCC TGACTGGCGT TCGGGAGGTT CGTGGAGACA NTCTTTCTGG 

1151 TTCCAGGCCT TGGATGCCAG GATTCCCCGC AGGTTGCCCC GCCTGCCCCA 

12 01 GCGNTACTGG CAAATGCGGC CCCTGTTTCT GGAGCTGCTT GGGAACCACG 
1251 CGCAGTGCCC CTACGGGGTG TTCCTCAAGA CGCACTGCCC GCTGCGAGCT 

13 01 GCGGTCACCC CAGCAGCCGG TGTCTGTGCC CGGGAGAAGC CCCAGGGCTC 

13 51 TGTGGCGGCC CCCGAGGAGG AGGAACACAG ACCCCCGTCG CCTGGTGCAG 

14 01 CTGCTCCGCC AG C AC AG C AG CCCCTGGCAG GTGTACGGCT TCGTGCGGGC 
1451 CTGCCTGCGC CGGCTGGTGC CCCCAGGCCT CTGGGGCTCC AGGCACAACG 
1501 AACGCCGCTT CCTCAGGAAC AC C AAGAAG T TCATCTCCCT GGGGAAGCAT 
1551 GCCAAGCTCT CGCTGCAGGA GCTGACGTGG AAGATGAGCG TGCGGGACTG 
16 01 CGCTTGGCTG CGCAGGAGCC CAGGGGTTGG CTGTGTTCCG GCCGCAGAGC 
16 51 ACCGTCTGCG T G AGG AG AT C CTGGCCAAGT TCCTGCACTG GCTGATGAGT 
1701 GTGTACGTCG TCGAGCTGCT CAGGTCTTTC TTTTATGTCA CGGAGACCAC 
1751 GTTTCAAAAG AACAGGCTCT TTTTCTACCG GAAGAGTGTC TGGAGCAAGT 
18 01 TGCAAAGCAT TGGAATCAGA CAGCACTTGA AGAGGGTGCA GCTGCGGGAG 
1851 CTGTCGGAAG C AG AGGT C AG GCAGCATCGG GAAGCCAGGC CCGCCCTGCT 
1901 GACGTCCAGA CTCCGCTTCA TCCCCAAGCC TGACGGGCTG CGGCCGATTG 
1951 TGAACATGGA CTACGTCGTG GGAGCCAGAA CGTTCCGCAG AGAAAAGAGG 
2 001 GCCGAGCGTC TCACCTCGAG GGTGAAGGCA CTGTTCAGCG TGCTCAACTA 
2 051 CGAGCGGGCG CGGCGCCCCG GCCTCCTGGG CGCCTCTGTG CTGGGCCTGG 
2101 ACGATATCCA CAGGGCCTGG CGCACCTTCG TGCTGCGTGT GCGGGCCCAG 
2151 GACCCGCCGC CTGAGCTGTA CTTTGTCAAG GTGGATGTGA CGGGCGCGTA 

22 01 CGACACCATC CCCCAGGACA GGCTCACGGA GGTCATCGCC AGCATCATCA 
2251 AACCCCAGAA CACGTACTGC GTGCGTCGGT ATGCCGTGGT CCAGAAGGCC 

23 01 GCCCATGGGC ACGTCCGCAA GGCCTTCAAG AGCCACGTCT CTACCTTGAC 

23 51 AGACCTCCAG CCGTACATGC GACAGTTCGT GGCTCACCTG CAGGANAACA 

24 01 GCCCGCTGAG GGATGCCGTC GT CAT CGAG C AGAGCTCCTC CCTGAATGAG 
24 51 GCCAGCAGTG GCCTCTTCGA CGTCTTCCTA CGCTTCATGT GCCACCACGC 
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2 501 CGTGCGCATC AGGGGCAAGT CCTACGTCCA GTGCCAGGGG ATCCCGCAGG 

2 551 GCTCCATCCT CTCCACGCTG CTCTGCAGCC TGTGCTACGG CGACATGGAG 

26 01 AACAAGCTGT TTGCGGGGAT TCGGCGGGAC GGGCTGCTCC TGCGTTTGGT 

2651 GGATGATTTC TTGTTGGTGA CACCTCACCT CACCCACGCG AAAACCTTCC 

2 7 01 TCAGGACCCT GGTCCGAGGT GTCCCTGAGT ATGGCTGCGT GGTGAACTTG 

2 751 CGGAAGACAG TGGTGAACTT CCCTGTAGAA GACGAGGCCC TGGGTGGCAC 

2801 GGCTTTTGTT CAGATGCCGG CCCACGGCCT ATTCCCCTGG TGCGGCCTGC 

2 851 TGCTGGATAC CCGGACCCTG GAGGTGCAGA GCGACTACTC CAGCTATGCC 

2 901 CGGACCTCCA TCAGAGCCAG TCTCACCTTC AACCGCGGCT TCAAGGCTGG 

2 951 GAGGAACATG CGTCGCAAAC TCTTTGGGGT CTTGCGGCTG AAGTGT CACA 

3 0 01 GCCTGTTTCT GGATTTGCAG GTGAACAGCC TCCAGACGGT GTGCACCAAC 
3 051 ATCTACAAGA TCCTCCTGCT GCAGGCGTAC AGGTTTCACG CATGTGTGCT 
3101 GCAGCTCCCA TTTCATCAGC AAGTTTGGAA GAACCCCACA TTTTTCCTGC 
3151 GCGTCATCTC TGACACGGCC TCCCTCTGCT ACTCCATCCT GAAAGCCAAG 
3 2 01 AACGCAGGGA TGTCGCTGGG GGCCAAGGGC GCCGCCGGCC CTCTGCCCTC 
3 251 CGAGGC CGTG CAGTGGCTGT GCCACCAAGC ATTCCTGCTC AAGCTGACTC 
33 01 GACACCGTGT CAC CTACGTG CCACTCCTGG GGTCACTCAG GACAGCCCAG 

33 51 ACGCAGCTGA GTCGGAAGCT CCCGGGGACG ACGCTGACTG CCCTGGAGGC 

34 01 CGCAGCCAAC CCGGCACTGC CCTCAGACTT C AAG AC CATC CTGGACTGAT 
34 51 GGCCACCCGC CCACAGCCAG GCCGAGAGCA GACAC CAGCA GCCCTGTCAC 
3 5 01 GCCGGGCTCT ACGTCCCAGG GAGGGAGGGG CGGCCCACAC CCAGGCCCGC 
3 551 ACCGCTGGGA GTCTGAGGCC TGAGTGAGTG TTTGGCCGAG GCCTGCATGT 
3 6 01 CCGGCTGAAG GCTGAGTGTC CGGCTGAGGC CTGAGCGAGT GTCCAGCCAA 
3 6 51 GGGCTGAGTG TCCAGCACAC CTGCCGTCTT CACTTCCCCA CAGGCTGGCG 
3 7 01 CTCGGCTCCA CCCCAGGGCC AGCTTTTCCT CACCAGGAGC CCGGCTTCCA 
3 751 CTCCCCACAT AGGAATAGTC CATCCCCAGA TTCGCCATTG TTCACCCCTC 
3 8 01 GCCCTGCCCT CCTTTGCCTT CCACCCCCAC CAT C C AGGTG GAGACCCTGA 
3 851 GAAGGACCCT GGGAG CTCTG GGAATTTGGA GTGAC CAAAG GTGTGCCCTG 
3 901 TACACAGGCG AGGACCCTGC ACCTGGATGG GGGTCCCTGT GGGTCAAATT 
3 951 GGGGGGAGGT GCTGTGGGAG TAAAATACTG AATATATGAG TTTTTCAGTT 
4001 TTGAAAAAAA AAAAAAAAAA AAAAAAAAA 
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GCAGCGCTGCGTCCTGCTGCGCACGTGGGAAGCCCTGGCCCCGGCCACCCCCGCGATGCC 
! + + + + + + 60 

CGTCGCGACGCAGGACGACGCGTGCACCCTTCGGGACCGGGGCCGGTGGGGGCGCTACGG 

a AALRPAAHVGS PGPGHPRDA 

b QRCVLLRTWEALAPATPAMP- 

c SAASCCARGKPWPRPPPRCR- 

GCGCGCTCCCCGCTGCCGAGCCGTGCGCTCCCTGCTGCGCAGCCACTACCGCGAGGTGCT 
gl + + + + + + 120 

CGCGCGAGGGGCGACGGCTCGGCACGCGAGGGACGACGCGTCGGTGATGGCGCTCCACGA 



a 
b 
c 



ARS PLPSRALPAAQPLPRGA 
RAPRCRAVRSLLRSHYREVL 
AL PAAE PCAPCCAATTARCC 



GCCGCTGGCCACGTTCGTGCGGCGCCTGGGGCCCCAGGGCTGGCGGCTGGTGCAGCGCGG 

121 + + + + + + 180 

CGGCGACCGGTGCAAGCACGCCGCGGACCCCGGGGTCCCGACCGCCGACCACGTCGCGCC 



a 
b 
c 



AAGHVRAAPGAPGLAAGAAR 
PLATFVRRLGPQGWRLVQRG 
RW PRS CGAWGPRAGGWC SAG- 



GGACCCGGCGGCTTTCCGCGCGNTGGTGGCCCANTGCNTGGTGTGCGTGCCCTGGGANGN 

181 + + 4- + + + 240 

CCTGGGCCGCCGAAAGGCGCGCNACCACCGGGTNACGNACCACACGCACGGGACCCTNCN 



a 
b 
c 



GPGGFPR?GGP? ? GVRALG ? 
DPAAFRA?VA?C?VCVPW? ? 
TRRLSARWWP7AWCACPG? ? 



ANGGCNGCCCCCCGCCGCCCCCTCCTTCCGCCAGGTGTCCTGCCTGAANGANCTGGTGGC 

241 + 4- 4- + + + 300 

TNCCGNCGGGGGGCGGCGGGGGAGGAAGGCGGTCCACAGGACGGACTTNCTNGACCACCG 



a 
b 
c 



7AAPRRPLLPPGVLPE? ?GG 
? ? PPAAPSFRQVSCL? ?LVA- 
G? PPPPPPSARCPA* ? ?WWP- 



CCGAGTGCTGCANANGCTGTGCGANCGCGGCGCGAANAACGTGCTGGCCTTCGGCTTCGC 

301 + 4- + 4- 4- + 360 

GGCTCACGACGTNTNCGACACGCTNGCGCCGCGCTTNTTGCACGACCGGAAGCCGAAGCG 



a 
b 
c 



PSAA?AVR?RRE?RAGLRLR 
RVL? ? LC ?RGA?NVLAFGFA 
ECC? ? CA?AAR?TCWPSASR 



GCTGCTGGACGGGGCCCGCGGGGGCCCCCCCGAGGCCTTCACCACCAGCGTGCGCAGCTA 
CGACGACCTGCCCCGGGCGCCCCCGGGGGGGCTCCGGAAGTGGTGGTCGCACGCGTCGAT 



a 
b 
c 



AAGRGPRGPPRGLHHQRAQL 
LLDGARGGPPEAFTTSVRSY 
CWTGPAGAPPRPS PPACAAT 



CCTGCCCAACACGGTGACCGACGCACTGCGGGGGAGCGGGGCGTGGGGGCTGCTGCTGCG 

421 4- + 4- 4- 4- 4- 480 

GGACGGGTTGTGCCACTGGCTGCGTGACGCCCCCTCGCCCCGCACCCCCGACGACGACGC 



a 
b 
c 



PAQHGDRRTAGERGVGAAAA 
LPNTVTDALRGSGAWGLLLR- 
CPTR* PTHCGGAGRGGCCCA- 
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a PRGRRRAGSPAGTLR? ? CAG 

b RVGDDVLVHLLARCA? FVLV 

c AWAT T C W F T C WHAAR ? L C W W - 

GGNTCCCAGCTGCGCCTACCANGTGTGCGGGCCGCCGCTGTACCAGCTCGGCGCTGCNAC 

541 + + + + + + 600 

CCNAGGGTCGACGCGGATGGTNCACACGCCCGGCGGCGACATGGTCGAGCCGCGACGNTG 

a GSQLRL P 7VRAAAVPARRC? 

b ?PSCAY?VCGPPLYQLGAAT- 

c ? PAAPT ? CAGRRCTSSAL ? L- 

TCAGGCCCGGCCCCCGCCACACGCTANTGGACCCGAANGCGTCTGGGATCCAACGGGCCT 

601 + 4- + + + + 660 

AGTCCGGGCCGGGGGCGGTGTGCGATNACCTGGGCTTNCGCAGACCCTAGGTTGCCCGGA 

a SGPAPATR?WTR?RLGSNGP 

b QARPPPHA7GPE ?VWDPTGL 

c RPGPRHTL?DP?ASGIQRAW- 

GGAACCATAGCGTCAGGGAGGCCGGGGTCCCCCTGGGCTGCCAGCCCCGGGTGCGAGGAG 

661 + 4- + + + + 720 

CCTTGGTATCGCAGTCCCTCCGGCCCCAGGGGGACCCGACGGTCGGGGCCCACGCTCCTC 

a GTIASGRPGSPWAASPGCEE 

b EP*RQGGRGPPGLPAPGARR- 

C NHSVREAGVPLGCQPRVRGG- 

GCGCGGGGGCAGTGCCAGCCGAAGTCTGCCGTTGCCCAAGAGGCCCAGGCGTGGCGCTGC 

721 + + + + + + 780 

CGCGCCCCCGTCACGGTCGGCTTCAGACGGCAACGGGTTCTCCGGGTCCGCACCGCGACG 

a ARGQCQ P KSAVAQEAQAWRC 

b RGGSASRSLPLPKRPRRGAA 

c AGAVPAEVCRC PRGPGVAL P- 

CCCTGAGCCGGAGCGGACGCCCGTTGGGCAGGGGTCCTGGGCCCACCCGGGCAGGACGCC 

781 + 4- + + + + 840 

GGGACTCGGCCTCGCCTGCGGGCAACCCGTCCCCAGGACCCGGGTGGGCCCGTCCTGCGG 

a P * AGADARWAGVLG PPGQDA 

b PEPERTPVGQGSWAHPGRTP- 

c LSRSGRPLGRGPGPTRAGRL- 

TGGACCGAGTGACCGTGGTTTCTGTGTGGTGTCACCTGCCAGACCCGCCGAAGAAGCCAC 

841 + + 4- 4- 4- 4- 900 

ACCTGGCTCACTGGCACCAAAGACACACCACAGTGGACGGTCTGGGCGGCTTCTTCGGTG 

a WTE* PWFLCGVTCQTRRRSH 

b GPSDRGFCVVSPARPAEEAT 

C DRVTVVSVWCHLPDPPKKPP- 

CTCTTTGGAGGGTGCGCTCTCTGGCACGCGCCACTCCCACCCATCCGTGGGCCGCCAGCA 

901 4- 4- 4- 4- 4- 4- 960 

GAGAAACCTCCCACGCGAGAGACCGTGCGCGGTGAGGGTGGGTAGGCACCCGGCGGTCGT 

a LFGGCALWHAPLPPIRGPPA 

b SLEGALSGTRHSHPSVGRQH 

C LWRVRS LARATPTHPWAAST- 

CCACGCGGGCCCCCCATCCACATCGCGGCCACCACGTCCTGGGACACGCCTTGTCCCCCG 
961 + + + + + + 1020 

GGTGCGCCCGGGGGGTAGGTGTAGCGCCGGTGGTGCAGGACCCTGTGCGGAACAGGGGGC 
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a 
b 
c 



a 
b 
c 



a 
b 
c 



a 
b 
c 



a 
b 
c 



a 
b 
c 



a 
b 
c 



a 
b 
c 
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PRGPPIHIAATTSWDTPCPP 
HAGPPSTSRPPRPGTRLVPR- 
TRAPH PHRGHHVLGHALS PG- 

GTGTACGCCGAGACCAAGCACTTCCTCTACTCCTCAGGCGACAAGNACACTGCGISrCCCTC 

1021 -f + + + + + 1080 

CACATGCGGCTCTGGTTCGTGAAGGAGATGAGGAGTCCGCTGTTClSrrGTGACGCNGGGAG 

VYAETKHFLYSSGDK?TA?L 
CTPRPSTSSTPQAT? TLRPS 
VRRDQALPLLLRRQ ? HC ? P P - 

CTTCCTACTCAATATATCTGAGGCCCAGCCTGACTGGCGTTCGGGAGGTTCGTGGAGACA 

1081 + + + + + + 1140 

GAAGGATGAGTTATATAGACTCCGGGTCGGACTGACCGCAAGCCCTCCAAGCACCTCTGT 

LPTQYI *GPA*LAFGRFVET 
FLLNISEAQPDWRSGGSWR? - 
SYS IYLRPSLTGVREVRGD ? - 

NTCTTTCTGGTTCCAGGCCTTGGATGCCAGGATTCCCCGCAGGTTGCCCCGCCTGCCCC^ 

1141 + + + + + + 1200 

NAGAAAGACCAAGGTCCGGAACCTACGGTCCTAAGGGGCGTCCAACGGGGCGGACGGGGT 

?FLVPGLGCQDSPQVAPPAP 
SFWFQALDARIPRRLPRLPQ- 
LSGSRPWMPGFPAGCPACPS- 

GCGOTACTGGCAAATGCGGCCCCTGTTTCTGGAGCTGCTTGGGAACCACGCGCAGTGCCC 

1201 + + + + + + 1260 

CGCNATGACCGTTTACGCCGGGGACAAAGACCTCGACGAACCCTTGGTGCGCGTCACGGG 

A ? LANAAPVSGAAWE PRAV.P 
RYWQMRPLFLELLGNHAQCP 
7TGKCGPCFWSCLGTTRSAP- 

CTACGGGGTGTTCCTCAAGACGCACTGCCCGCTGCGAGCTGCGGTCACCCCAGCAGCCGG 

1261 + + + + + + 1320 

GATGCCCCACAAGGAGTTCTGCGTGACGGGCGACGCTCGACGCCAGTGGGGTCGTCGGCC 

LRGVPQDALPAASCGHPSSR 
YGVFLKTHC PLRAAVTPAAG 
TGCS SRRTARCELRS PQQ PV- 

TGTCTGTGCCCGGGAGAAGCCCCAGGGCTCTGTGGCGGCCCCCGAGGAGGAGGAACACAG 

1321 + + + + + + 1380 

ACAGACACGGGCCCTCTTCGGGGTCCCGAGACACCGCCGGGGGCTCCTCCTCCTTGTGTC 

CLC PGEAPGLCGGPRGGGTQ.- 
VCAREKPQGSVAAPEEEEHR- 
SVPGRS P RALWRP PRRRNTD- 

ACCCCCGTCGCCTGGTGCAGCTGCTCCGCCAGCACAGCAGCCCCTGGCAGGTGTACGGCT 

1381 + + + + + + 1440 

TGGGGGCAGCGGACCACGTCGACGAGGCGGTCGTGTCGTCGGGGACCGTCCACATGCCGA 

TPVAWCSCSASTAAPGRCTA 
PPS PGAAAPPAQQPLAGVRL 
PRRLVQLLRQHSS PWQVYGF- 

TCGTGCGGGCCTGCCTGCGCCGGCTGGTGCCCCCAGGCCTCTGGGGCTCCAGGCACAACG 

1441 + + + + + + 1500 

AGCACGCCCGGACGGACGCGGCCGACCACGGGGGTCCGGAGACCCCGAGGTCCGTGTTGC 
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a SCGPACAGWCPQASGAPGTT 
b RAGLPAPAGAPRPLGLQAQR 
c VRACLRRLVPPGLWGSRHNE- 

AACGCCGCTTCCTC^GGAACACCAAGAAGTTCATCTCCCTGGGGAAGC^ 

1501 + + + + + + 1560 

TTGCGGCGAAGGAGTCCTTGTGGTTCTTCAAGTAGAGGGACCCCTTCGTACGGTTCGAGA 

a NAASSG'TPRSSSPWGSMPSS 

b TPLPQEHQEVHLPGEACQAL- 

C RRFLRNTKKF I SLGKHAKL S - 



CGCTGCAGGAGCTGACGTGGAAGATGAGCGTGCGGGACTGCGCTTGGCTGCGCAGGAGCC 

1561 + + + + + + 1620 

GCGACGTCCTCGACTGCACCTTCTACTCGCACGCCCTGACGCGAACCGACGCGTCCTCGG 



a 
b 
c 



RCRS*RGR*ACGTALGCAGA 
AAGADVEDERAGLRLAAQEP 
LQELTWKMSVRDCAWLRRSP 



CAGGGGTTGGCTGTGTTCCGGCCGCAGAGCACCGTCTGCGTGAGGAGATCCTGGCCAAGT 

1621 + + + + + + 1680 

GTCCCCAACCGACACAAGGCCGGCGTCTCGTGGCAGACGCACTCCTCTAGGACCGGTTCA 



b 
c 



QGLAVFRPQSTVCVRRSWPS 
RGWLCSGRRAPSA*GDPGQV 
GVGCVPAAEHRLREE ILAKF 



TCCTGCACTGGCTGATGAGTGlXjTACGTCGTCGAGCTGCTCAGGTCTTTClUU u iATGTCA 

1681 + + + + + + 1740 

AGGACGTGACCGACTACTCACACATGCAGCAGCTC 



a 
b 
c 



SCTG**VCTSSSCSGLSFMS 
PALADECVRRRAAQVFLLCH 
LHWLMSVYVVELLRS FFYVT- 



CGGAGACC^CGTTTCAAAAGAAC^GGCTCTTTTTCTACCGGAAGAGTGTCTGGAGCAAGT 

1741 + + + + + + 1800 

GCCTCTGGTGCAAAGTTTTCTTGTCCGAGAAAAAGATGGCCTTCTCACAGACCTCGTTCA 



a 
b 

c 



RRPRFKRTGSFSTGRVSGAS 
GDHVSKEQALFLPEECLEQV 
ETTFQKNRLFFYRKSVWSKL 



TGCAAAGCATTGGAATCAGACAGCACTTGAAGAGGGTGCAGCTGCGGGAGCTGTCGGAAG 

1801 + + + + + + 1860 

ACGTTTCGTAACCTTAGTCTGTCGTGAACTTCTCCCACGTCGACGCCCTCGACAGCCTTC 



a 
b 
c 



CKALESDST*RGCSCGSCRK 
AKHWNQTALEEGAAAGAVGS 
QSIGIRQHLKRVQLRELSEA 



CAGAGGTCAGGCAGCATCGGGAAGCCAGGCCCGCCCTGCTGACGTCCAGACTCCGCTTCA 

1861 + + + + + + 1920 

GTCTCCAGTCCGTCGTAGCCCTTCGGTCCGGGCGGGACGACTGCAGGTCTGAGGCGAAGT 



a 
b 
c 



QRSGSIGKPGPPC*RPDSAS 
RGQAASGSQARPADVQTPLH 
EVRQHREARPALLTSRLRFI 



TCCCCAAGCCTGACGGGCTGCGGCCGATTGTGAACATGGACTACGTCGTGGGAGCCAGAA 

1921 + + + + + + 1980 

AGGGGTTCGGACTGCCCGACGCCGGCTAACACTTGTACCTGATGCAGCACCCTCGGTCTT 
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a SPSLTGCGRL*TWTTSWEPE 

b P Q A * RAAADCEHGLRRGSQN 

C PKPDGLRP IVNMDYVVGART- 

CGTTCCGCAGAGAAAAGAGGGCCGAGCGTCTCACCTCGAGGGTGAAGGCACTGTTCAGCG 

1981 + + + + + + 2040 

GC^GGCGTCTCTTTTCTCCCGGCTCGC^GAGTGGAGCTCCC^CTTCCGTGACTUVGTCG^ 

a RSAEKRGPSVS PRG*RHCSA 

b VPQRKEGRASHLEGEGTVQR 

C FRREKRAERLTSRVKALFSV- 

TGCTCAACTACGAGCGGGCGCGGCGCCCCGGCCTCCTGGGCGCCTCTGTGCTGGGCCTGG 

2041 + + + + + + 2100 

ACGAGTTGATGCTCGCCCGCGCCGCGGGGCCGGAGGACCCGCGGAGACACGACCCGGACC 

a CSTTSGRGAPASWAPLCWAW 

b AQLRAGAAPRPPGRLCAGPG- 

c LNYERARRPGLLGASVLGLD- 

ACGATATCCACAGGGCCTGGCGCACCTTCGTGCTGCGTGTGCGGGCCCAGGACCCGCCGC 

2101 + + + + + + 2160 

TGCTATAGGTGTCCCGGACCGCGTGGAAGCACGACGCACACGCCCGGGTCCTGGGCGGCG 

a TISTGPGAPSCCVCGPRTRR 

b RYPQGLAHLRAACAGPGPAA- 

C DIHRAWRTFVLRVRAQDPPP- 

CTGAGCTGTACTTTGTCAAGGTGGATGTGACGGGCGCGTACGACACCATCCCCCAGGACA 

2161 + + + + + + 2220 

GACTCGACATGAAACAGTTCCACCTACACTGCCCGCGCATGCTGTGGTAGGGGGTCCTGT 

a LSCTLSRWM*RARTTPSPRT 

b *AVLCQGGCDGRVRHHPPGQ 

C ELYFVKVDVTGAYDTIPQDR- 

GGCTCACGGAGGTCATCGCCAGCATCATCAAACCCCAGAACACGTACTGCGTGCGTCGGT 

2221 + + + + + + 2280 

CCGAGTGCCTCCAGTAGCGGTCGTAGTAGTTTGGGGTCTTGTGCATGACGCACGCAGCCA 

a GSRRS S PASSNPRTRTACVG 

b AHGGHRQHHQTPEHVLRASV- 

c LTEVIAS I I KPQNTYCVRRY- 

ATGCCGTGGTCCAGAAGGCCGCCCATGGGCACGTCCGCAAGGCCTTCAAGAGCCACGTCT 

2281 + + + + + + 2340 

TACGGCACCAGGTCTTCCGGCGGGTACCCGTGCAGGCGTTCCGGAAGTTCTCGGTGCAGA 

a MPWSRRPPMGTSARPSRATS 

b CRGPEGRPWARPQGLiQEPRL 

C AVVQ KAAHGHVRKAFKSHVS- 

CTACCTTGACAGACCTCC^GCCGTACATGCGACAGTTCGTGGCTCACCTGCAGGANAACA 

2341 + + + + + + 2400 

GATGGAACTGTCTGGAGGTCGGCATGTACGCTGTCAAGCACCGAGTGGACGTCCTNTT 

a LP*QTSSRTCDSSWLTCR?T 

b YLDRPPAVHATVRGSPAG?Q 

C TLTDLQ PYMRQFVAHLQ ?NS- 

GCCCGCTGAGGGATGCCGTCGTCATCGAGCAGAGCTCCTCCCTGAATGAGGCCAGCAGTG 

2401 + + + + + + 2460 

CGGGCGACTCCCTACGGCAGCAGTAGCTCGTCTCGAGGAGGGACTTACTCCGGTCGTCAC 



+ 
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a AR*GMPSSSSRAPP*MRPAV 

b PAEGCRRHRAELLPE*GQQW- 

c PLRDAVVI EQSSSLNEASSG- 

GCCTCTTCGACGTCTTCCTACGCTTCATGTGCCACCACGCCGTGCGCATCAGGGGCAAGT 

2461 + + + + + + 2520 

CGGAGAAGCTGCAGAAGGATGCGAAGTACACGGTGGTGCGGCACGCGTAGTCCCCGTTCA 

a ASSTSSYASCATTPCASGAS 

b PLRRLPTLHVPPRRAHQGQV- 

C LFDVFLRFMCHHAVR IRGKS- 

CCTACGTCCAGTGCCAGGGGATCCCGCAGGGCTCCATCCTCTCCACGCTGCTCTGCAGCC 

2521 + + + + + + 2580 

GGATGCAGGTCACGGTCCCCTAGGGCGTCCCGAGGTAGGAGAGGTGCGACGAGACGTCGG 

a PTSSARGSRRAPSSPRCSAA 

b LRPVPGDPAGLHPLHAALQP- 

c YVQCQGI PQGS ILSTLLCSL- 

TGTGCTACGGCGACATGGAGAACAAGCTGTTTGCGGGGATTCGGCGGGACGGGC 

2581 + + + + + + 2640 

ACACGATGCCGCTGTACCTCTTGTTCGACAAACGCCCCTAAGCCGCCCTGCCCGACGAGG 

a CATATWRTSCLRGFGGTGC S 

b VLRRHGEQAVCGDSAGRAAP 
c CYGDMENKLFAG I RRDGLLL- 

TGCGTTTGGTGGATGATTTCTTGTTGGTGACACCTC^CCTCACCCACGCGAAAACCTTCC 

2641 + + + + + ' + 2700 

ACGGAAACCACCTACTAAAGAACAACCACTG 

a CVWWMISCW*HLTSPTRKPS 

b AFGG*FLVGDTSPHPRENLP- 

c RLVDDFLLVTPHLTHAKTFL- 

TCAGGACCCTGGTCCGAGGTGTCCCTGAGTATGGCTGCGTGGTGAACTTGCGGAAGACAG 

2701 + + + + + + 2760 

AGTCCTGGGACCAGGCTCCACAGGGACTCATACCGACGCACCACTTGAACGCCTTCTGTC 

a SGPWSEVSLSMAAW*TCGRQ 

b QDPGPRCP *VWLRGELAEDS 

C RTLVRGVPEYGCVVNLRKTV- 

TGGTGAACTTCCCTGTAGAAGACGAGGCCCTGGGTGGCACGGCTTTTGTTCAGATGCCGG 

2761 + + + + + + 2820 

ACCACTTGAAGGGACATCTTCTGCTCCGGGACCCACCGTGCCGAAAACAAGTCTACGGCC 

a W* TSL* KTRPWVARLLFRCR 

b GELPCRRRGPGWHGFCSDAG- 

C VNF PVEDEALGGTAFVQMPA- 

CCCACGGCCTATTCCCCTGGTGCGGCCTGCTGCTGGATACCCGGACCCTGGAGGTGCAGA 

2821 + + + + + + 2880 

GGGTGCCGGATAAGGGGACCACGCCGGACGACGACCTATGGGCCTGGGACCTCCACGTCT 

a PTAYSPGAACCWIPGPWRCR 

b PRPIPLVRPAAGYPDPGGAE 

C HGLFPWCGLLLDTRTLEVQS- 

GCGACTACTCCAGCTATGCCCGGACCTCCATCAGAGCCAGTCTCACCTTCAACCGCGGCT 

2881 + + + + + + 2940 

CGCTGATGAGGTCGATACGGGCCTGGAGGTAGTCTCGGTCAGAGTGGAAGTTGGCGCCGA 
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a ATTPAMPGPPSEPVSPSTAA 

b RLLQLCPDLHQSQSHLQPRL- 

C DYSSYARTS I RASLTFNRGF- 

TCAAGGCTGGGAGGAACATGCGTCGCAAACTCTTTGGGGT 

2941 + + + + + + 3000 

AGTTCCGACCCTCCTTGTACGCAGCGTTTGAGAAACCC 

a SRLGGTCVANSLGSCG* SVT 

b QGWEEHASQTLWGLAAEVSQ- 

C KAGRNMRRKL FGVLRL KCH S - 

GCCTGTTTCTGGATTTGCAGGTGAACAGCCTCCA^ 

3001 + + + + + '+ 3060 

CGGACAAAGACCTAAACGTCCACTTGTCGGAGGTCTGCCACACGTGGTTGTAGATGTTCT 

a ACFWICR*TASRRCAPTSTR 

b PVSGFAGEQPPDGVHQHLQD 

c LFLDLQVNSLQTVCTNIYKI- 

TCCTCCTGCTGCAGGCGTACAGGTTTCACGCATGTGTGCTGCAGCTCCCATTTCATCAGC 

3061 + + + + + + 3120 

AGGAGGACGACGTCCGCATGTCCAAAGTGCGTACACACGACGTCGAGGGTAAAGTAGTCG 

a SSCCRRTGFTHVCCSSHFIS 

b PPAAGVQVSRMCAAAPISSA- 

C LLLQAYRFHACVLQLPFHQQ- 

AAGTTTGGAAGAACCCCACATTTTTCCTGCGCGTCATCTCTGACACGGCCTCCCTCTGCT 

3121 + + + + + + 3180 

TTCAAACCTTCTTGGGGTGTAAAAAGGACGCGCAGTAGAGACTGTGCCGGAGGGAGACGA 

a KFGRTPHFSCASSLTRPPSA 

b SLEEPHI FPARHL*HGLPLL 

C VWKNPTFFLRVI SDTASLCY- 

ACTCCATCCTGAAAGCCAAGAACGCAGGGATGTCGCTGGGGGCCAAGGGCGCCGCCGGCC 

3181 + + + + + + 3240 

TGAGGTAGGACTTTCGGTTCTTGCGTCCCTACAGCGACCCCCGGTTCCCGCGGCGGCCGG 

a TPS * KPRTQGCRWGPRAPPA 

b LHPESQERRDVAGGQGRRRP- 

C S I LKAKNAGM-S LGAKGAAGP- 

CTCTGCCCTCCGAGGCCGTGCAGTGGCTGTGCCACCAAGCATTCCTGCTCAAGCTGACTC 

3241 + + + + + + 3300 

GAGACGGGAGGCTCCGGCACGTCACCGACACGGTGGTTCGTAAGGACGAGTTCGACTGAG 

a LCPPRPCSGCATKHSCSS*L 

b SALRGRAVAVPPS I PAQADS 

C LPSEAVQWLCHQAFLLKLTR- 

GACACCGTGTCACCTACGTGCCACTCCTGGGGTCACTCAGGACAGCCCAGACGCAGCTGA 

3301 + + + + + + 3360 

CTGTGGCACAGTGGATGCACGGTGAGGACCCCAGTGAGTCCTGTCGGGTCTGCGTCGACT 

a DTVSPTCHSWGHSGQPRRS. * 

b TPCHLRATPGVTQDSPDAAE 

C HRVTYVPLLGSLRTAQTQLS- 

GTCGGAAGCTCCCGGGGACGACGCTGACTGCCCTGGAGGCCGCAGCC^CCCGGCACTGC 

3361 + + + + + + 3420 

CAGCCTTCGAGGGCCCCTGCTGCGACTGACGGGACCTCCGGCGTCGGTTGGGCCGTGACG 
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5 2D04 



a 
b 
c 



3421 



VGSSRGRR*LPWRPQPTRHC 
SEAPGDDADCPGGRSQPGTA 
RKLPGTTLTALEAAANPALP- 

CCTC^GACTTC^GACCATCCTGGACTGATGGCCACCCGCCCACAGCCAGGCCGAGAG^ 

+ + + + + + 348O 

GGAGTCTGAAGTTCTGGTAGGACCTGACTACCGGTGGGCGGGTGTCGGTCCGGCTCTCGT 



a 
b 
c 



PQTSRPSWTDGHPPTARPRA 
LRLQDHPGLMATRPQPGREQ 
SDFKTILD*WPPAHSQAESR 



GACACCAGCAGCCCTGTCACGCCGGGCTCTACGTCCCAGGGAGGGAGGGGCGGCCCACAC 

3481 + + + + + + 3540 

CTGTGGTCGTCGGGACAGTGCGGCCCGAGATGCAGGGTCCCTCCCTCCCCGCCGGGTGTG 



a 
b 
c 



DTSSPVTPGSTSQGGRGGPH 
TPAALS RRALRPREGGAAHT 
HQQPCHAGLYVPGREGRPTP 



CCAGGCCCGCACCGCTGGGAGTCTGAGGCCTGAGTGAGTGTTTGGCCGAGGCCTGCATGT 

3541 + + + + + + 3600 

GGTCCGGGCGTGGCGACCCTCAGACTCCGGACTCACTCACAAACCGGCTCCGGACGTACA 



a 
b 
c 



PGPHRWESEA*VSVWPRPAC 
QARTAGSLRPE*VFGRGLHV- 
RPAPLGV* GLSECLAEACMS- 



CCGGCTGAAGGCTGAGTGTCCGGCTGAGGCCTGAGCGAGTGTCCAGCCAAGGGCTGAGTG 

3601 + + + + + + 3660 

GGCCGACTTCCGACTCACAGGCCGACTCCGGACTCGCTCACAGGTCGGTTCCCGACTCAC 



a 
b 
c 



PAEG*VSG*GLSECPAKG*V 
RLKAEC PAEA*ASVQPRAEC 
G* RLSVRLRPERVSSQGLSV- 



TCCAGCACACCTGCCGTCTTCACTTCCCCACAGGCTGGCGCTCGGCTCCACCCCAGGGCC 

3661 + + + + + + 3720 

AGGTCGTGTGGACGGCAGAAGTGAAGGGGTGTCCGACCGCGAGCCGAGGTGGGGTCCCGG 



a 
b 
c 



SSTPAVFTSPQAGARLHPRA 
PAHLPS SLPHRLALGSTPGP 
QHTCRLHFPTGWRSAPPQGQ 



AGCTTTTCCTCACCAGGAGCCCGGCTTCCACTCCCCACATAGGAATAGTCCATCCCCAGA 

3721 + + + + + + 3780 

TCGAAAAGGAGTGGTCCTCGGGCCGAAGGTGAGGGGTGTATCCTTATCAGGTAGGGGTCT 



a 
b 
c 



SFSSPGARLPLPT*E*SIPR 
AFPHQEPGFHSPHRNSPSPD- 
LFLTRSPASTPHIGIVHPQI- 



TTCGCCATTGTTCACCCCTCGCCCTGCCCTCCTTTGCCTTCCACCCCCACCATCCAGGTG 

3781 + + + + + + 3840 

AAGCGGTAACAAGTGGGGAGCGGGACGGGAGGAAACGGAAGGTGGGGGTGGTAGGTCCAC 



a 
b 
c 



FAIVHPSPCPPLPSTPTIQV 
SPLFTPRPALLCLPPPPSRW- 
RHCS PLALPSFAFHPHHPGG- 



GAGACCCTGAGAAGGACCCTGGGAGCTCTGGGAATTTGGAGTGACCAAAGGTGTGCCCTG 

3841 + + + + + -f 3900 

CTCTGGGACTCTTCCTGGGACCCTCGAGACCCTTAAACCTCACTGGTTTCCACACGGGAC 



F/G. 72H 



+ 




a ETLRRTLGALGIWSDQRCAL 

b RP* EGPWELWEFGVTKGVPC 

C DPEKDPGSSGNLE*PKVCPV- 

TACACAGGCGAGGACCCTGCACCTGGATGGGGGTCCCTGTGGGTCAAATTGGGGGGAGGT 

3901 + + + + + + 3960 

ATGTGTCCGCTCCTGGGACGTGGACCTACCCCCAGGGACACCCAGTTTAACCCCCCTCCA 

a YTGEDPAPGWGSLWVKLGGG 

b TQARTLHLDGGPCGSNWGEV- 

C HRRGPCTWMGVPVGQI G G R C - 

GCTGTGGGAGTAAAATACTGAATATATGAGTTTTTCAGTTTTGA 

3961 + + + + + + 4020 

CGACACCCTCATTTTATGACTTATATACTCAAAAAGTC 

a AVGVKY* IYEFFSFEKKKKK 

b LWE *NTEYMS FSVLKKKKKK- 

c CGSKILNI *VFQF*KKKKKK- 

AAAAAAAAA 

4021 4029 

TTTTTTTTT 

a K K K 

b K K 

C K K 
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i 

met 

GCAGCGCTGCGTCCTGCTGCGCACGTGGGAAGCCCTGGCCCCGGCCACCCCCGCG ATG 

10 

pro arg ala pro arg cys arg ala val arg ser leu leu arg ser 
CCG CGC GCT CCC CGC TGC CGA GCC GTG CGC TCC CTG CTG CGC AGC 

20 30 
his tyr arg glu val leu pro leu ala thr phe val arg arg leu 
CAC TAC CGC GAG GTG CTG CCG CTG GCC ACG TTC GTG CGG CGC CTG 

40 

gly pro gin gly trp arg leu val gin arg gly asp pro ala ala 
GGG CCC CAG GGC TGG CGG CTG GTG CAG CGC GGG GAC CCG GCG GCT 

50 60 
phe arg ala leu val ala gin cys leu val cys val pro trp asp 
TTC CGC GCG CTG GTG GCC CAG TGC CTG GTG TGC GTG CCC TGG GAC 

70 

ala arg pro pro pro ala ala pro ser phe arg gin val ser cys 
GCA CGG CCG CCC CCC GCC GCC CCC TCC TTC CGC CAG GTG TCC TGC 

80 90 
leu lys glu leu val ala arg val leu gin arg leu cys glu arg 
CTG AAG GAG CTG GTG GCC CGA GTG CTG CAG AGG CTG TGC GAG CGC 

100 

gly ala lys asn val leu ala phe gly phe ala leu leu asp gly 
GGC GCG AAG AAC GTG CTG GCC TTC GGC TTC GCG CTG CTG GAC GGG 

110 120 
ala arg gly gly pro pro glu ala phe thr thr ser val arg ser 
GCC CGC GGG GGC CCC CCC GAG GCC TTC ACC ACC AGC GTG CGC AGC 

130 

tyr leu pro asn thr val thr asp ala .leu arg gly ser gly ala 
TAC CTG CCC AAC ACG GTG ACC GAC GCA CTG CGG GGG AGC GGG GCG 

140 150 
trp gly leu leu leu arg arg val gly asp asp val leu val his 
TGG GGG CTG CTG CTG CGC CGC GTG GGC GAC GAC GTG CTG GTT CAC 

160 

leu leu ala arg cys ala leu phe val leu val ala pro ser cys 
CTG CTG GCA CGC TGC GCG CTC TTT GTG CTG GTG GCT CCC AGC TGC 

170 180 
ala tyr gin val cys gly pro pro leu tyr gin leu gly ala ala 
GCC TAC CAG GTG TGC GGG CCG CCG CTG TAC CAG CTC GGC GCT GCC 

190 

thr gin ala arg pro pro pro his ala ser gly pro arg arg arg 
ACT CAG GCC CGG CCC CCG CCA CAC GCT AGT GGA CCC CGA AGG CGT 
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leu 
CTG 


gly 
GGA 


cys 
TGC 


glu 
GAA 


arg 
CGG 


ala 
GCC 


trp 
TGG 


asn 
AAC 


his 
CAT 


ser 
AGC 


val 
GTC 


arg 
AGG 


glu 
GAG 


ala 
GCC 


gly 
GGG 


val 
GTC 


pro 

ccc 


leu 
CTG 


gly 
GGC 


leu 
CTG 


pro 
CCA 


ala 
GCC 


pro 
CCG 


220 
gly 
GGT 


ala 
GCG 


arg 
AGG 


arg 
AGG 


arg 
CGC 


gly 
GGG 


gly 
GGC 


ser 
AGT 


ala 
GCC 


ser 
AGC 


230 
arg 
CGA 


ser 
AGT 


leu 
CTG 


pro 
CCG 


leu 
TTG 


pro 
CCC 


lys 
AAG 


arg 
AGG 


pro 
CCC 


arg 
AGG 


240 
arg 
CGT 


giy 

GGC 


ala 
GCT 


ala 
GCC 


pro 
CCT 


glu 
GAG 


pro 
CCG 


glu 
GAG 


arg 
CGG 


thr 
ACG 


250 
pro 
CCC 


val 
GTT 


gly 
GGG 


gin 
CAG 


gly 
GGG 


ser 
TCC 


trp 
TGG 


ala 
GCC 


his 
CAC 


pro 
CCG 


260 
gly 
GGC 


arg 
AGG 


thr 
ACG 


arg 
CGT 


gly 
GGA 


pro 
CCG 


ser 
AGT 


asp 
GAC 


arg 
CGT 


gly 
GGT 


270 
phe 
TTC 


cys 
TGT 


val 
GTG 

gly 
GGT 


val 
GTG 

ala 
GCG 


ser 
TCA 

leu 
CTC 


pro 
CCT 
2 90 
ser 
TCT 


ala 
GCC 

gly 
GGC 


arg 
AGA 

thr 
ACG 


pro 
CCC 

arg 
CGC 


ala 
GCC 

his 
CAC 


280 
glu 
GAA 

ser 
TCC 


glu 
GAA 

his 
CAC 


ala 
GCC 

pro 
CCA 


thr 
ACC 

ser 
TCC 


ser 
TCT 

val 
GTG 


leu 
TTG 
3 00 

giy 

GGC 


glu 
GAG 

arg 
CGC 


gin 
CAG 


his 
CAC 


his 
CAC 


ala 
GCG 


gly 
GGC 


pro 
CCC 


pro 
CCA 


ser 
TCC 


310 
thr 
ACA 


ser 
TCG 


arg 
CGG 


pro 
CCA 


pro 
CCA 


arg 
CGT 


pro 
CCC 


trp 
TGG 


asp 
GAC 


thr 
ACG 


320 
pro 
CCT 


cys 
TGT 


pro 
CCC 


pro 
CCG 


val 
GTG 


tyr 
TAC 


ala 
GCC 


glu 
GAG 


thr 
ACC 


lys 
AAG 


33 0 
his 
CAC 


phe 
TTC 


leu 
CTC 


tyr 
TAC 


ser 
TCC 


ser 
TCA 


gly 
GGC 


asp 
GAC 


lys 
AAG 


glu 
GAG 


340 
gin 
CAG 


leu 
CTG 


arg 
CGG 


pro 
CCC 


ser 
TCC 


phe 
TTC 


leu 
CTA 


leu 
CTC 


ser 
AGC 


ser 
TCT 


350 
leu 
CTG 


arg 
AGG 


pro 
CCC 


ser 
AGC 


leu 
CTG 


thr 
ACT 


gly 
GGC 


ala 
GCT 


arg 
CGG 


arg 
AGG 


360 
leu 
CTC 


val 
GTG 


glu 

GAG 


thr 
ACC 


ile 
ATC 


phe 
TTT 


leu 
CTG 


gly 
GGT 


ser 
TCC 


arg 
AGG 


370 
pro 
CCC 


trp 
TGG 


met 
ATG 


pro 
CCA 


gly 
GGG 


thr 
ACT 


pro 
CCC 


arg 
CGC 


arg 
AGG 


leu 
TTG 


380 
pro 
CCC 


arg 
CGC 


leu 
CTG 


pro 
CCC 


gin 
CAG 


arg 
CGC 


tyr 
TAC 


trp 
TGG 


gin 
CAA 


met 
ATG 


390 
arg 
CGG 


pro 
CCC 


leu 
CTG 


phe 
TTT 


leu 
CTG 


glu 
GAG 


leu 
CTG 


leu 
CTT 


giy 

GGG 


asn 
AAC 


400 
his 
CAC 


ala 
GCG 


gin 
CAG 


cys 
TGC 


pro 
CCC 


tyr 
TAC 


gly 
GGG 


val 
GTG 


leu 
CTC 


leu 
CTC 


410 
lys 
AAG 


thr 
ACG 


his 
CAC 


cys 
TGC 


pro 
CCG 


leu 
CTG 


arg 
CGA 


ala 
GCT 


ala 
GCG 


val 
GTC 


420 
thr 
ACC 


pro 
CCA 
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ala ala gly 
GCA GCC GGT 



ala pro glu 
GCC CCC GAG 



leu arg gin 
CTC CGC CAG 



ala cys leu 
GCC TGC CTG 



his asn glu 
CAC AAC GAA 



leu gly lys 
CTG GGG AAG 



met ser val 
ATG AGC GTG 



gly cys val 
GGC TGT GTT 



ala lys phe 
GCC AAG TTC 



leu arg ser 
CTC AGG TCT 



arg leu phe 
AGG CTC TTT 



ile gly ile 
ATT GGA ATC 

ser glu ala 
TCG GAA GCA 



leu thr ser 
CTG ACG TCC 



pro ile val 
CCG ATT GTG 



val cys ala 
GTC TGT GCC 

440 

glu glu asp 
GAG GAG GAC 



his ser ser 
CAC AGC AGC 

470 

arg arg leu 
CGC CGG CTG 



arg arg phe 
CGC CGC TTC 

500 

his ala lys 
CAT GCC AAG 



arg asp cys 
CGG GAC TGC 

530 

pro ala ala 
CCG GCC GCA 



leu his trp 
CTG CAC TGG 

560 

phe phe tyr 
TTC TTT TAT 



phe tyr arg 
TTC TAC CGG 

590 

arg gin his 
AGA CAG CAC 

glu val arg 
GAG GTC AGG 

620 

arg leu arg 
AGA CTC CGC 



asn met asp 
AAC ATG GAC 



arg 
CGG 


430 
glu lys 
GAG AAG 


thr 
ACA 


asp 
GAC 


pro 
CCC 


pro 
CCC 


trp 
TGG 


460 
gin 
CAG 


val 
GTG 


nro 
CCC 


pro 
CCA 


1 eu 
CTC 


arg 
AGG 


490 
asn 
AAC 


leu 
CTC 


ser 
TCG 


1 eu 
CTG 


ala 
GCT 


trp 
TGG 


520 
leu 
CTG 


glu 
GAG 


hi s 
CAC 


arcr 
CGT 


leu 
CTG 


met 
ATG 


550 
ser 
AGT 


val 
GTC 


thr 
ACG 


glu 
GAG 


pro 
CCG 


ser 
AGT 


580 
val 
GTC 


leu 
TTG 

gin 
CAG 


lys 
AAG 

his 
CAT 


arg 
AGG 
610 
arg 
CGG 


phe 
TTC 


ile 
ATC 


pro 
CCC 


tyr 
TAC 


val 
GTC 


640 
val 
GTG 



pro gin gly 
CCC CAG GGC 



arg arg leu 
CGT CGC CTG 



val tyr gly 
GTG TAC GGC 



gly leu trp 
GGC CTC TGG 



thr lys lys 
ACC AAG AAG 



gin glu leu 
CAG GAG CTG 



arg arg ser 
CGC AGG AGC 



leu arg glu 
CTG CGT GAG 



val tyr val 
GTG TAC GTC 



thr thr phe 
ACC ACG TTT 



trp ser lys 
TGG AGC AAG 



val gin leu 
GTG CAG CTG 

glu ala arg 
GAA. GCC AGG 



lys pro asp 
AAG CCT GAC 



gly ala arg 
GGA GCC AGA 



ser val ala 
TCT GTG GCG 

450 
val gin leu 
GTG CAG CTG 



phe val arg 
TTC GTG CGG 

480 
gly ser arg 
GGC TCC AGG 



phe ile ser 
TTC ATC TCC 

510 
thr trp lys 
ACG TGG AAG 



pro gly val 
CCA GGG GTT 

540 

glu ile leu 
GAG ATC CTG 



val glu leu 
GTC GAG CTG 

570 

gin lys asn 
CAA AAG AAC 



leu gin ser 
TTG CAA AGC 

600 
arg glu leu 
CGG GAG CTG 

pro ala leu 
CCC GCC CTG 

630 

gly leu arg 
GGG CTG CGG 



thr phe arg 
ACG TTC CGC 
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arg glu lys 
AGA GAA AAG 



phe ser val 
TTC AGC GTG 



gly ala ser 
GGC GCC TCT 



thr phe val 
ACC TTC GTG 



tyr phe val 
TAC TTT GTC 



gin asp arg 
CAG GAC AGG 



asn thr tyr 
AAC ACG TAC 



his gly his 
CAT GGG CAC 



thr asp leu 
ACA GAC CTC 



glu thr ser 
GAG ACC AGC 



ser leu asn 
TCC CTG AAT 



phe met cys 
TTC ATG TGC 



gin cys gin 
CAG TGC CAG 



cys ser leu 
TGC AGC CTG 



ile arg arg 
ATT CGG CGG 



;bo 

arg ala glu 
AGG GCC GAG 



leu asn tyr 
CTC AAC TAC 

680 

val leu gly 
GTG CTG GGC 



leu arg val 
CTG CGT GTG 

710 

lys val asp 
AAG GTG GAT 



leu thr glu 
CTC ACG GAG 

740 

cys val arg 
TGC GTG CGT 



val arg lys 
GTC CGC AAG 

770 

gin pro tyr 
CAG CCG TAC 



pro leu arg 
CCG CTG AGG 

800 

glu ala ser 
GAG GCC AGC 



his his ala 
CAC CAC GCC 

830 

gly ile pro 
GGG ATC CCG 



cys tyr gly 
TGC TAC GGC 

860 

asp gly leu 
GAC GGG CTG 



arg leu thr 
CGT CTC ACC 

670 

glu arg ala 
GAG CGG GCG 



leu asp asp 
CTG GAC GAT 

700 

arg ala gin 
CGG GCC CAG 



val thr gly 
GTG ACG GGC 

730 

val ile ala 
GTC ATC GCC 



arg tyr ala 
CGG TAT GCC 

760 

ala phe lys 
GCC TTC AAG 



met arg gin 
ATG CGA CAG 

790 

asp ala val 
GAT GCC GTC 



ser gly leu 
AGT GGC CTC 

820 

val arg ile 
GTG CGC ATC 



gin gly ser 
CAG GGC TCC 

850 

asp met glu 
GAC ATG GAG 



leu leu arg 
CTC CTG CGT 



ser, arg val 
TCG AGG GTG 



arg arg pro 
CGG CGC CCC 



ile his arg 
ATC CAC AGG 



asp pro pro 
GAC CCG CCG 



ala tyr asp 
GCG TAC GAC 



ser ile ile 
AGC ATC ATC 



val val gin 
GTG GTC CAG 



ser his val 
AGC CAC GTC 



phe val ala 
TTC GTG GCT 



val ile glu 
GTC ATC GAG 



phe asp val 
TTC GAC GTC 



arg gly lys 
AGG GGC AAG 



ile leu ser 
ATC CTC TCC 



asn lys leu 
AAC AAG CTG 



leu val asp 
TTG GTG GAT 



660 
lys ala leu 
AAG GCA CTG 



gly leu leu 
GGC CTC CTG 

690 

ala trp arg 
GCC TGG CGC 



pro glu leu 
CCT GAG CTG 

720 
thr ile pro 
ACC ATC CCC 



lys pro gin 
AAA CCC CAG 

750 
lys ala ala 
AAG GCC GCC 



ser thr leu 
TCT ACC TTG 

780 

his leu gin 
CAC CTG CAG 



gin ser ser 
CAG AGC TCC 

810 

phe leu arg 
TTC CTA CGC 



ser tyr val 
TCC TAC GTC 

840 
thr leu leu 
ACG CTG CTC 



phe ala gly 
TTT GCG GGG 

870 
asp phe leu 
GAT TTC TTG 
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leu val thr 
TTG GTG ACA 



leu val arg 
CTG GTC CGA 



lys thr val 
AAG ACA GTG 



thr ala phe 
ACG GCT TTT 

gly leu leu 
GGC CTG CTG 



ser ser tyr 
TCC AGC TAT 



arg gly phe 
CGC GGC TTC 



val leu arg 
GTC TTG CGG 



asn ser leu 
AAC AGC CTC 



leu gin ala 
CTG CAG GCG 



his gin gin 
CAT CAG CAA 



ser asp thr 
TCT GAC ACG 



ala gly met 
GCA GGG ATG 



ser glu ala 
TCC GAG GCC 



leu thr arg 
CTG ACT CGA 



pro his leu 
CCT CAC CTC 

890 

gly val pro 
GGT GTC CCT 



val asn phe 
GTG AAC TTC 

920 

val gin met 
GTT CAG ATG 

leu asp thr 
CTG GAT ACC 

950 

ala arg thr 
GCC CGG ACC 



lys ala gly 
AAG GCT GGG 

980 

leu lys cys 
CTG AAG TGT 



gin thr val 
CAG ACG GTG 

1010 

tyr arg phe 
TAC AGG TTT 



val trp lys 
GTT TGG AAG 

1040 

ala ser leu 
GCC TCC CTC 



ser leu gly 
TCG CTG GGG 

1070 

val gin trp 
GTG CAG TGG 



his arg val 
CAC CGT GTC 



880 

thr his ala 
ACC CAC GCG 



glu tyr gly 
GAG TAT GGC 

910 

pro val glu 
CCT GTA GAA 



pro ala his 
CCG GCC CAC 
940 

arg thr leu 
CGG ACC CTG 



ser ile arg 
TCC ATC AGA 

970 

arg asn met 
AGG AAC ATG 



his ser leu 
CAC AGC CTG 

1000 

cys thr asn 
TGC ACC AAC 



his ala cys 
CAC GCA TGT 

1030 

asn pro thr 
AAC CCC ACA 



cys tyr ser 
TGC TAC TCC 

1060 

ala lys gly 
GCC AAG GGC 



leu cys his 
CTG TGC CAC 

1090 

thr tyr val 
ACC TAC GTG 



lys 
AAA 


thr 
ACC 


phe 
TTC 


cys 
TGC 


val 
GTG 


val 
GTG 


asp 
GAC 


glu 
GAG 


ala 
GCC 


gly 
GGC 


leu 
CTA 


phe 
TTC 


glu 
GAG 


val 
GTG 


gln 
CAG 


ala 
GCC 


ser 
AGT 


val 
GTC 


arg 
CGT 


arg 
CGC 


lys 
AAA 


phe 
TTT 


leu 
CTG 


asp 
GAT 


ile 
ATC 


tyr 
TAC 


lys 
AAG 


val 
GTG 


leu 
CTG 


gin 
CAG 


\ 
} 

phe 
TTT 


phe 
TTC 


leu 
CTG 


ile 
ATC 


leu 
CTG 


lys 
AAA 


) 

ala 
GCC 


ala 
GCC 


gly 
GGC 


gln 
CAA 


ala 
GCA 


phe 
TTC 


) 

pro 
CCA 


leu 
CTC 


leu 
CTG 



leu arg thr 
CTC AGG ACC 

900 

asn leu arg 
AAC TTG CGG 



leu gly gly 
CTG GGT GGC 

930 

pro trp cys 
CCC TGG TGC 

ser asp tyr 
AGC GAC TAC 

960 

thr phe asn 
ACC TTC AAC 



leu phe gly 
CTC TTT GGG 

990 
leu gln val 
TTG CAG GTG 



ile leu leu 
ATC CTC CTG 

1020 
leu pro phe 
CTC CCA TTT 



arg val ile 
CGC GTC ATC 

1050 
ala lys asn 
GCC AAG AAC 



pro leu pro 
CCT CTG CCC 

1080 
leu leu lys 
CTG CTC AAG 



gly ser leu 
GGG TCA CTC 



FIG. 74E 



103/103 



1100 1110 
arg thr ala gln thr gln leu ser arg lys leu pro gly thr thr 
AGG ACA GCC CAG ACG CAG CTG AGT CGG AAG CTC CCG GGG ACG ACG 

1120 

leu thr ala leu glu ala ala ala asn pro ala leu pro ser asp 
CTG ACT GCC CTG GAG GCC GCA GCC AAC CCG GCA CTG CCC TCA GAC 

1130 1132 
phe lys thr ile leu asp OP 

TTC AAG ACC ATC CTG GAC TGA TGGCCACCCGCCCACAGCCAGGCCGAGAGCAGA 

CACCAGCAGCCCTGTCACGCCGGGCTCTACGTCCCAGGGAGGGAGGGGCGGCCCACACCC 

AGGCCCGCACCGCTGGGAGTCTGAGGCCTGAGTGAGTGTTTGGCCGAGGCCTGCATGTCC 

GGCTGAAGGCTGAGTGTCCGGCTGAGGCCTGAGCGAGTGTCCAGCCAAGGGCTGAGTGTC 

CAGCACACCTGCCGTCTTCACTTCCCCACAGGCTGGCGCTCGGCTCCACCCCAGGGCCAG 

CTTTTCYTCACCAGGAGCCCGGCTTCCACTCCCCACATAGGAATAGTCCATCCCCAGATT 

CGCCATTGTTCACCCYTCGCCCTGCCYTCCTTTGCCTTCCACCCCCACCATCCAGGTGGA 

GACCCTGAGAAGGACCCTGGGAGCTCTGGGAATTTGGAGTGACCAAAGGTGTGCCCTGTA 

CACAGGCGAGGACCCTGCACCTGGATGGGGGTCCCTGTGGGTCAAATTGGGGGGAGGTGC 

TGTGGGAGTAAAATACTGAATATATGAGTTTTTCAGTTTTGRAAAAAAAAAAAAAAAAAA 

AAAAAAAAAA 
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